summary | refs | log | tree | commit | diff
path: root/rag/upload.py
diff options
context:
space:
mode:
author Gustaf Rydholm <gustaf.rydholm@gmail.com> 2024-04-14 23:14:21 +0200
committer Gustaf Rydholm <gustaf.rydholm@gmail.com> 2024-04-14 23:14:21 +0200
commit bd87b7fed75d5e504eb40c6616c2f1e1e56a0451 (patch)
tree f6e3b68c48f150c8b6e6acd33d6e760f334a456d /rag/upload.py
parent 3c59ed779e3b30ab4877ae94242c9df076df681a (diff)
Refactor cli
Diffstat (limited to 'rag/upload.py')
-rw-r--r-- rag/upload.py 30
1 files changed, 0 insertions, 30 deletions
diff --git a/rag/upload.py b/rag/upload.py
deleted file mode 100644
index 8567142..0000000
--- a/rag/upload.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from pathlib import Path
-
-import click
-from dotenv import load_dotenv
-from loguru import logger as log
-from tqdm import tqdm
-
-from rag.retriever.retriever import Retriever
-
-
-@click.command()
-@click.option(
- "-d",
- "--directory",
- help="The full path to the root directory containing pdfs to upload",
- type=click.Path(exists=True),
-)
-def main(directory: str):
- log.info(f"Uploading pfs found in directory {directory}...")
- retriever = Retriever()
- pdfs = Path(directory).glob("**/*.pdf")
- for path in tqdm(list(pdfs)):
- retriever.add_pdf(path=path)
-
-
-if __name__ == "__main__":
- log.remove()
- log.add(lambda msg: tqdm.write(msg, end=""), colorize=True)
- load_dotenv()
- main()