diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2024-04-14 23:14:21 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2024-04-14 23:14:21 +0200 |
commit | bd87b7fed75d5e504eb40c6616c2f1e1e56a0451 (patch) | |
tree | f6e3b68c48f150c8b6e6acd33d6e760f334a456d /rag/upload.py | |
parent | 3c59ed779e3b30ab4877ae94242c9df076df681a (diff) |
Refactor cli
Diffstat (limited to 'rag/upload.py')
-rw-r--r-- | rag/upload.py | 30 |
1 files changed, 0 insertions, 30 deletions
```diff
diff --git a/rag/upload.py b/rag/upload.py
deleted file mode 100644
index 8567142..0000000
--- a/rag/upload.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from pathlib import Path
-
-import click
-from dotenv import load_dotenv
-from loguru import logger as log
-from tqdm import tqdm
-
-from rag.retriever.retriever import Retriever
-
-
-@click.command()
-@click.option(
-    "-d",
-    "--directory",
-    help="The full path to the root directory containing pdfs to upload",
-    type=click.Path(exists=True),
-)
-def main(directory: str):
-    log.info(f"Uploading pfs found in directory {directory}...")
-    retriever = Retriever()
-    pdfs = Path(directory).glob("**/*.pdf")
-    for path in tqdm(list(pdfs)):
-        retriever.add_pdf(path=path)
-
-
-if __name__ == "__main__":
-    log.remove()
-    log.add(lambda msg: tqdm.write(msg, end=""), colorize=True)
-    load_dotenv()
-    main()
```