summaryrefslogtreecommitdiff
path: root/rag/rag.py
blob: 1f6a17606c7133f622c136434a8189c447ffcda1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
from dataclasses import dataclass
from typing import Any, Dict, Generator, List

from loguru import logger as log

from rag.generator import get_generator
from rag.generator.prompt import Prompt
from rag.retriever.rerank import get_reranker
from rag.retriever.retriever import Retriever
from rag.retriever.vector import Document


@dataclass
class Message:
    """One chat message together with the client it was created for."""

    role: str
    content: str
    client: str

    def as_dict(self) -> Dict[str, str]:
        """Return the message as a plain ``role`` + text dictionary.

        The text is stored under ``"message"`` when ``client`` is
        ``"cohere"`` and under ``"content"`` for every other client.
        """
        # Only the name of the text field differs between clients.
        text_key = "message" if self.client == "cohere" else "content"
        return {"role": self.role, text_key: self.content}


class Rag:
    """Tie together a retriever, a reranker and a generator for one client.

    The instance also keeps the running list of chat messages and the role
    names (``self.user`` / ``self.bot``) that match the active client.
    """

    def __init__(self, client: str) -> None:
        """Create the pipeline components for ``client``.

        Args:
            client: Client name; passed to ``get_reranker`` and
                ``get_generator`` and used to pick the role names.
        """
        self.messages: List[Message] = []
        self.retriever = Retriever()
        self.client = client
        self.reranker = get_reranker(self.client)
        self.generator = get_generator(self.client)
        # Single source of truth for the role names (shared with set_client).
        self.__set_roles()

    def __set_roles(self) -> None:
        """Set ``self.bot`` and ``self.user`` from the current client.

        ``"ollama"`` gets ``"assistant"`` / ``"user"``; every other client
        gets ``"CHATBOT"`` / ``"USER"``.
        """
        is_ollama = self.client == "ollama"
        self.bot = "assistant" if is_ollama else "CHATBOT"
        self.user = "user" if is_ollama else "USER"

    def set_client(self, client: str) -> None:
        """Switch to another client.

        Rebuilds the reranker and generator, updates the role names and
        clears the stored messages (each message records the client it was
        created for).

        Args:
            client: Name of the client to switch to.
        """
        self.client = client
        self.reranker = get_reranker(self.client)
        self.generator = get_generator(self.client)
        self.__set_roles()
        self.__reset_messages()
        log.debug(f"Swapped client to {self.client}")

    def __reset_messages(self) -> None:
        """Replace the stored message history with an empty list."""
        log.debug("Deleting messages...")
        self.messages = []

    def retrieve(self, query: str) -> List[Document]:
        """Fetch documents for ``query`` and pass them through the reranker.

        Args:
            query: The search query.

        Returns:
            The result of ``reranker.rerank_documents`` applied to the
            documents returned by the retriever.
        """
        documents = self.retriever.retrieve(query)
        log.info(f"Found {len(documents)} relevant documents")
        return self.reranker.rerank_documents(query, documents)

    def add_message(self, role: str, content: str) -> None:
        """Append a message for the current client to the history.

        Args:
            role: Role label of the message (e.g. ``self.user``/``self.bot``).
            content: Text of the message.
        """
        self.messages.append(
            Message(role=role, content=content, client=self.client)
        )

    def generate(self, prompt: Prompt) -> Generator[Any, Any, Any]:
        """Generate a response for ``prompt`` and record it as a user turn.

        Args:
            prompt: The prompt to answer; ``prompt.query`` is given to the
                reranker and ``prompt.to_str()`` is stored in the history.

        Returns:
            Whatever ``generator.generate`` returns for the prompt and the
            reranked messages.
        """
        # Rerank BEFORE recording the new prompt so the history handed to
        # the generator does not already contain the current turn.
        messages = self.reranker.rerank_messages(prompt.query, self.messages)
        self.add_message(self.user, prompt.to_str())
        return self.generator.generate(prompt, messages)