Spaces:

pradeepsengarr
/

Custom_Rag_Bot

Running

pradeepsengarr committed on Jun 3

Commit

9a8a050

verified ·

1 Parent(s): f1e12d6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -31,18 +31,28 @@ doc_texts = []
 # Extract text from PDF or TXT
 def extract_text(file):
     text = ""
-    file_bytes = file.read()
-    if file.name.endswith(".pdf"):
         pdf_stream = BytesIO(file_bytes)
         doc = fitz.open(stream=pdf_stream, filetype="pdf")
         for page in doc:
             text += page.get_text()
-    elif file.name.endswith(".txt"):
         text = file_bytes.decode("utf-8")
     else:
         return "❌ Unsupported file type."
     return text
 # Process the file, build FAISS index
 def process_file(file):
     global index, doc_texts

 # Extract text from PDF or TXT
 def extract_text(file):
     text = ""
+    # Handle if file is a NamedString (like on HF Spaces)
+    if isinstance(file, str):
+        with open(file, "rb") as f:
+            file_bytes = f.read()
+        filename = file
+    else:
+        file_bytes = file.read()
+        filename = file.name
+    if filename.endswith(".pdf"):
         pdf_stream = BytesIO(file_bytes)
         doc = fitz.open(stream=pdf_stream, filetype="pdf")
         for page in doc:
             text += page.get_text()
+    elif filename.endswith(".txt"):
         text = file_bytes.decode("utf-8")
     else:
         return "❌ Unsupported file type."
     return text
 # Process the file, build FAISS index
 def process_file(file):
     global index, doc_texts