RAGBOT

Running

Rahatara committed 6 days ago

Commit

0b6997c

•

1 Parent(s): 3c3edd2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -19,16 +19,17 @@ class MyApp:
         self.index = None
         self.model = SentenceTransformer('all-MiniLM-L6-v2')
-    def load_pdfs(self, files: List[gr.File]) -> str:
         """Extracts text from multiple PDF files and stores them."""
         self.documents = []
-        for file in files:
-            doc = fitz.open(stream=file.read(), filetype="pdf")
             for page_num in range(len(doc)):
                 page = doc[page_num]
                 text = page.get_text()
                 self.documents.append({
-                    "file_name": file.name,
                     "page": page_num + 1,
                     "content": text
                 })
@@ -55,7 +56,7 @@ class MyApp:
 app = MyApp()
-def upload_files(files: List[gr.File]) -> str:
     return app.load_pdfs(files)
 def build_vector_db() -> str:

         self.index = None
         self.model = SentenceTransformer('all-MiniLM-L6-v2')
+    def load_pdfs(self, files: List[Dict]) -> str:
         """Extracts text from multiple PDF files and stores them."""
         self.documents = []
+        for file_dict in files:
+            file_path = file_dict['name']  # Access the file path
+            doc = fitz.open(file_path)  # Open the PDF using the file path
             for page_num in range(len(doc)):
                 page = doc[page_num]
                 text = page.get_text()
                 self.documents.append({
+                    "file_name": os.path.basename(file_path),
                     "page": page_num + 1,
                     "content": text
                 })
 app = MyApp()
+def upload_files(files: List[Dict]) -> str:
     return app.load_pdfs(files)
 def build_vector_db() -> str: