Spaces:

mitulagr2
/

whatsthispdf

Runtime error

mitulagr2 committed on Jul 8

Commit

4c88907

•

1 Parent(s): 82c3144

Update rag.py

Files changed (2) hide show

app/main.py CHANGED Viewed

@@ -66,9 +66,7 @@ async def websocket_endpoint(websocket: WebSocket, client_id: int):
 @app.post("/upload")
-def upload(files: list[UploadFile]):
-    session_assistant.clear()
     try:
         os.makedirs(files_dir)
         for file in files:
@@ -86,6 +84,12 @@ def upload(files: list[UploadFile]):
     return "Files inserted!"
 @app.get("/")
 def ping():
     return "Pong!"

 @app.post("/upload")
+def upload(files: list[UploadFile]):
     try:
         os.makedirs(files_dir)
         for file in files:
     return "Files inserted!"
+@app.get("/clear")
+def ping():
+    session_assistant.clear()
+    return "All files have been cleared."
 @app.get("/")
 def ping():
     return "Pong!"

app/rag.py CHANGED Viewed

@@ -22,6 +22,8 @@ logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 class ChatPDF:
     def __init__(self):
         self.text_parser = SentenceSplitter(chunk_size=512, chunk_overlap=24)
@@ -70,6 +72,7 @@ class ChatPDF:
         logger.info("enumerating docs")
         for doc_idx, doc in enumerate(docs):
             curr_text_chunks = self.text_parser.split_text(doc.text)
             text_chunks.extend(curr_text_chunks)
             doc_ids.extend([doc_idx] * len(curr_text_chunks))
@@ -104,8 +107,11 @@ class ChatPDF:
     def ask(self, query: str):
         logger.info("retrieving the response to the query")
         streaming_response = self.query_engine.query(query)
         return streaming_response.response_gen
     def clear(self):
-        pass

 logger = logging.getLogger(__name__)
 class ChatPDF:
+    pdf_count = 0
     def __init__(self):
         self.text_parser = SentenceSplitter(chunk_size=512, chunk_overlap=24)
         logger.info("enumerating docs")
         for doc_idx, doc in enumerate(docs):
+            self.pdf_count = self.pdf_count + 1
             curr_text_chunks = self.text_parser.split_text(doc.text)
             text_chunks.extend(curr_text_chunks)
             doc_ids.extend([doc_idx] * len(curr_text_chunks))
     def ask(self, query: str):
         logger.info("retrieving the response to the query")
+        if not self.pdf_count > 0:
+            return "Please, add a PDF document first."
         streaming_response = self.query_engine.query(query)
         return streaming_response.response_gen
     def clear(self):
+        self.pdf_count = 0