From 95305f59df84caded50286b1a57b6075e48725a8 Mon Sep 17 00:00:00 2001 From: Gustaf Rydholm Date: Wed, 24 Apr 2024 01:10:43 +0200 Subject: Rerank working llama3 sucks at rag --- README.md | 24 +++++++++++++++--------- 1 file changed, 15 insertions(+), 9 deletions(-) (limited to 'README.md') diff --git a/README.md b/README.md index aeabf5f..718b66d 100644 --- a/README.md +++ b/README.md @@ -12,21 +12,27 @@ RAG with ollama (and optionally cohere) and qdrant. This is basically a glorifie Create a .env file or set the following parameters: ```.env -CHUNK_SIZE = -CHUNK_OVERLAP = +CHUNK_SIZE = 4096 +CHUNK_OVERLAP = 256 -ENCODER_MODEL = -EMBEDDING_DIM = +ENCODER_MODEL = "nomic-embed-text" +EMBEDDING_DIM = 768 +RETRIEVER_TOP_K = 15 +RETRIEVER_SCORE_THRESHOLD = 0.5 -GENERATOR_MODEL = +RERANK_MODEL = "mixedbread-ai/mxbai-rerank-large-v1" +RERANK_TOP_K = 5 -DOCUMENT_DB_NAME = -DOCUMENT_DB_USER = +GENERATOR_MODEL = "dolphin-llama3" -QDRANT_URL = -QDRANT_COLLECTION_NAME = +DOCUMENT_DB_NAME = "rag" +DOCUMENT_DB_USER = "aktersnurra" + +QDRANT_URL = "http://localhost:6333" +QDRANT_COLLECTION_NAME = "knowledge-base" COHERE_API_KEY = # OPTIONAL +COHERE_RERANK_MODEL = "rerank-english-v3.0" ``` ### 2. Ollama -- cgit v1.2.3-70-g09d2