diff --git a/.env b/.env
index 34d98ba..77707d6 100644
--- a/.env
+++ b/.env
@@ -8,3 +8,5 @@ DATABASE_URL="file:./dev.db"
 CHROMA_PORT=5666
 CHROMA_ENDPOINT=http://localhost:${CHROMA_PORT}
 CHROME_PERSIST_DIRECTORY=./chroma
+EMBEDDING_MODEL=mxbai-embed-large
+LLM=llama3.1
diff --git a/app/lib/llm.server.ts b/app/lib/llm.server.ts
index 7c6609c..d227b3e 100644
--- a/app/lib/llm.server.ts
+++ b/app/lib/llm.server.ts
@@ -15,22 +15,24 @@ import { Principal } from "./users";
 
 const OLLAMA_ENDPOINT = process.env.OLLAMA_ENDPOINT || "http://localhost:11434";
 const CHROMA_ENDPOINT = process.env.CHROMA_ENDPOINT || "http://localhost:5666";
+const EMBEDDING_MODEL = process.env.EMBEDDING_MODEL || "mxbai-embed-large";
+const LLM = process.env.LLM || "llama3.1";
+
 export const CHROMA_COLLECTION_NAME =
   process.env.CHROMA_COLLECTION_NAME || "expense_dev";
 
 const llm = new Ollama({
   baseUrl: OLLAMA_ENDPOINT,
-  model: "llama3.1", // Default value
+  model: LLM, // Default value
   temperature: 0,
   maxRetries: 2,
 });
 
 const embeddings = new OllamaEmbeddings({
-  model: "mxbai-embed-large", // Default value
+  model: EMBEDDING_MODEL, // Default value
   baseUrl: OLLAMA_ENDPOINT, // Default value
 });
 
-console.log(CHROMA_ENDPOINT);
 export const vectorStore = new Chroma(embeddings, {
   collectionName: CHROMA_COLLECTION_NAME,
   url: CHROMA_ENDPOINT, // Optional, will default to this value
diff --git a/package-lock.json b/package-lock.json
index 5adc75c..2040b30 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,5 +1,5 @@
 {
-  "name": "cerbos-rag-clean",
+  "name": "cerbos-rag",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {