summary | refs | log | tree | commit | diff
path: root/rag/llm
diff options
context:
space:
mode:
Diffstat (limited to 'rag/llm')
-rw-r--r-- rag/llm/__init__.py 0
-rw-r--r-- rag/llm/encoder.py 23
-rw-r--r-- rag/llm/generator.py 0
3 files changed, 23 insertions, 0 deletions
diff --git a/rag/llm/__init__.py b/rag/llm/__init__.py
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/rag/llm/__init__.py
diff --git a/rag/llm/encoder.py b/rag/llm/encoder.py
new file mode 100644
index 0000000..d5e0566
--- /dev/null
+++ b/rag/llm/encoder.py
@@ -0,0 +1,23 @@
+import os
+from typing import List
+
+import numpy as np
+import ollama
+
+
+class Encoder:
+    """Turn text into embedding vectors via ``ollama.embeddings``.
+
+    The embedding model name is read from the ``ENCODER_MODEL`` environment
+    variable when an instance is created.
+    """
+
+    def __init__(self) -> None:
+        """Load the model name and set the prefix used for search queries.
+
+        Raises:
+            KeyError: If ``ENCODER_MODEL`` is not set in the environment.
+        """
+        self.model = os.environ["ENCODER_MODEL"]
+        # Prepended to search queries only (see ``query``); document chunks
+        # passed to ``encode`` are embedded without it.
+        self.query_prompt = "Represent this sentence for searching relevant passages: "
+
+    def __encode(self, prompt: str) -> np.ndarray:
+        """Embed a single string and return the result as a float32 array.
+
+        The embedding is wrapped in a list before conversion, so a flat
+        embedding of length ``d`` comes back with shape ``(1, d)``.
+        """
+        # Use the model stored on the instance. The bare name ENCODER_MODEL
+        # is not defined in this module and raised NameError on every call.
+        response = ollama.embeddings(model=self.model, prompt=prompt)
+        return np.array([response["embedding"]]).astype("float32")
+
+    def encode(self, doc: List[str]) -> List[np.ndarray]:
+        """Embed every chunk of ``doc``, preserving order.
+
+        Returns:
+            One array per chunk; an empty ``doc`` gives an empty list.
+        """
+        return [self.__encode(chunk) for chunk in doc]
+
+    def query(self, query: str) -> np.ndarray:
+        """Embed a search query, prefixed with ``self.query_prompt``."""
+        return self.__encode(self.query_prompt + query)
diff --git a/rag/llm/generator.py b/rag/llm/generator.py
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/rag/llm/generator.py