summary | refs | log | tree | commit | diff
path: root/rag/rag.py
blob: 5b5f5ab83b176c28218ba5a3dce93b16183b64a3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from pathlib import Path
from typing import List, Optional

from langchain_core.documents.base import Document
from llm.encoder import Encoder
from llm.generator import Generator
from parser import pdf
from db.documents import Documents
from db.vectors import Vectors


class RAG:
    """Hold the generator, encoder, document store and vector store together.

    The name presumably stands for retrieval-augmented generation; the code
    visible here only shows that the class owns one instance each of
    ``Generator``, ``Encoder``, ``Documents`` and ``Vectors`` and can hand a
    PDF path to ``pdf.parser``.
    """

    def __init__(self) -> None:
        """Create the four collaborators, each with its default constructor."""
        # All components are built eagerly and without arguments, in this
        # order. NOTE(review): whether any of these constructors load models
        # or open connections is not visible from this file -- confirm before
        # reordering or making them lazy.
        self.generator = Generator()
        self.encoder = Encoder()
        self.docs = Documents()
        self.vectors = Vectors()

    def add_pdf(self, filepath: Path) -> Optional[List[Document]]:
        """Parse the PDF at ``filepath`` via ``pdf.parser``.

        Args:
            filepath: Path of the PDF file passed straight to ``pdf.parser``.

        Returns:
            Annotated as an optional list of ``Document``.
            NOTE(review): in the lines visible here the parsed ``chunks`` are
            neither stored nor returned, so the method would fall through and
            yield ``None``; confirm whether further steps are intended.
        """
        # Presumably ``pdf.parser`` splits the file into Document chunks --
        # TODO confirm against the parser module.
        chunks = pdf.parser(filepath)