pradeepsengarr committed on
Commit b7194cd · verified · 1 Parent(s): 14b7206

Update app.py

Files changed (1): app.py (+80 -47)
app.py CHANGED
@@ -4,7 +4,8 @@ import fitz
import faiss
import numpy as np
from sentence_transformers import SentenceTransformer
- from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+ from transformers import AutoTokenizer, pipeline
+ from transformers import BitsAndBytesConfig, AutoModelForCausalLM
from langchain.text_splitter import RecursiveCharacterTextSplitter
from huggingface_hub import login

@@ -13,79 +14,111 @@ if not hf_token:
    raise ValueError("Hugging Face token not found.")
login(token=hf_token)

+ # Load embedding model
embed_model = SentenceTransformer("BAAI/bge-base-en-v1.5")

- model_id = "tiiuae/falcon-rw-1b"
+ # Load quantized Mistral with 8-bit
+ model_id = "mistralai/Mistral-7B-Instruct-v0.1"
+ bnb_config = BitsAndBytesConfig(
+     load_in_8bit=True,
+     llm_int8_threshold=6.0,
+     llm_int8_skip_modules=None,
+ )
+
tokenizer = AutoTokenizer.from_pretrained(model_id, token=hf_token)
- model = AutoModelForCausalLM.from_pretrained(model_id, device_map={"": "cpu"}, torch_dtype="auto", token=hf_token)
+ model = AutoModelForCausalLM.from_pretrained(
+     model_id,
+     quantization_config=bnb_config,
+     device_map="auto",
+     token=hf_token
+ )
llm = pipeline("text-generation", model=model, tokenizer=tokenizer)

+ # State
index = None
doc_texts = []

+ # Extract text
def extract_text(file):
-     text = ""
-     file_path = file.name if hasattr(file, 'name') else file
-     if file_path.endswith(".pdf"):
-         with fitz.open(file_path) as doc:
-             for page in doc:
-                 text += page.get_text()
-     elif file_path.endswith(".txt"):
-         with open(file_path, "r", encoding="utf-8") as f:
-             text = f.read()
-     else:
-         return "Unsupported file type."
-     return text
+     try:
+         text = ""
+         file_path = file.name if hasattr(file, 'name') else file
+         if file_path.endswith(".pdf"):
+             with fitz.open(file_path) as doc:
+                 for page in doc:
+                     text += page.get_text()
+         elif file_path.endswith(".txt"):
+             with open(file_path, "r", encoding="utf-8") as f:
+                 text = f.read()
+         else:
+             return "❌ Unsupported file type."
+         return text
+     except Exception as e:
+         return f"❌ Error extracting text: {e}"

+ # Process file
def process_file(file):
    global index, doc_texts
-     text = extract_text(file)
-     if text.startswith("Unsupported"):
-         return text
-
-     splitter = RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=50)
-     doc_texts = splitter.split_text(text)
-
-     embeddings = embed_model.encode(doc_texts, convert_to_numpy=True)
-     dim = embeddings.shape[1]
-     index = faiss.IndexFlatL2(dim)
-     index.add(embeddings)
-
-     return "Document processed successfully. You can now ask questions."
+     try:
+         text = extract_text(file)
+         if text.startswith("❌"):
+             return text
+
+         # Trim large documents
+         text = text[:15000]
+
+         splitter = RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=50)
+         doc_texts = splitter.split_text(text)
+
+         if not doc_texts:
+             return "❌ Could not split document."
+
+         embeddings = embed_model.encode(doc_texts, convert_to_numpy=True)
+         dim = embeddings.shape[1]
+         index = faiss.IndexFlatL2(dim)
+         index.add(embeddings)
+
+         return "✅ Document processed. You may ask your question below."
+     except Exception as e:
+         return f"❌ Error processing file: {e}"

- def generate_answer(question):
-     global index, doc_texts
-     if index is None or not doc_texts:
-         return "Please upload and process a document first."
-
-     question_emb = embed_model.encode([question], convert_to_numpy=True)
-     _, I = index.search(question_emb, k=3)
-     context = "\n".join([doc_texts[i] for i in I[0]])
-
-     prompt = (
-         f"You are an intelligent assistant. Use the context below to answer the user's question clearly, "
-         f"politely, and completely. Do not just extract text — give a helpful response.\n\n"
-         f"Context:\n{context}\n\n"
-         f"User's Question: {question}\n\n"
-         f"Answer:"
-     )
-
-     result = llm(prompt, max_new_tokens=200, do_sample=True, temperature=0.7)
-     return result[0]["generated_text"].split("Answer:")[-1].strip()
-
- with gr.Blocks(title="Document Q&A Assistant") as demo:
+ # Answer generator
+ def generate_answer(question):
+     global index, doc_texts
+     try:
+         if index is None or not doc_texts:
+             return "⚠️ Please upload and process a document first."
+
+         question_emb = embed_model.encode([question], convert_to_numpy=True)
+         _, I = index.search(question_emb, k=3)
+         context = "\n".join([doc_texts[i] for i in I[0]])
+
+         prompt = (
+             f"You are a helpful assistant. Use the context below to answer the question clearly.\n\n"
+             f"Context:\n{context}\n\n"
+             f"Question: {question}\n\n"
+             f"Answer:"
+         )
+
+         result = llm(prompt, max_new_tokens=200, do_sample=True, temperature=0.7)
+         return result[0]["generated_text"].split("Answer:")[-1].strip()
+     except Exception as e:
+         return f"❌ Error generating answer: {e}"
+
+ # Gradio UI
+ with gr.Blocks(title="📄 Document Q&A Assistant") as demo:
    gr.Markdown("<h1 style='text-align: center;'>📄 Document AI Assistant</h1>")
-     gr.Markdown("Upload a PDF or TXT file, and ask questions about its content. The assistant will provide answers using the document as context.")
+     gr.Markdown("Upload a PDF or TXT file, and ask questions about its content. The assistant uses Mistral 7B (quantized) for reasoning.")

    with gr.Row():
        file_input = gr.File(label="Upload PDF or TXT", file_types=[".pdf", ".txt"])
        upload_output = gr.Textbox(label="Upload Status")

    with gr.Row():
-         question_input = gr.Textbox(label="Ask a Question", placeholder="What is this document about?")
+         question_input = gr.Textbox(label="Ask a Question", placeholder="e.g. What is the summary?")
        answer_output = gr.Textbox(label="Answer")

    file_input.change(fn=process_file, inputs=file_input, outputs=upload_output)
    question_input.submit(fn=generate_answer, inputs=question_input, outputs=answer_output)

- demo.launch()
+ demo.launch(show_error=True, share=False)
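A note for anyone reproducing this commit outside the Space: 8-bit loading via bitsandbytes requires a CUDA GPU, unlike the CPU-pinned Falcon setup it replaces. Below is a minimal sketch (not part of the commit) for checking that the quantized load works and what it costs in memory; it reuses the model id and config from the diff, and get_memory_footprint is a standard transformers helper.

# Sketch: verify the 8-bit load and its memory footprint.
# Assumes bitsandbytes, accelerate, and a CUDA GPU are available;
# load_in_8bit raises on CPU-only machines.
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

model_id = "mistralai/Mistral-7B-Instruct-v0.1"
bnb_config = BitsAndBytesConfig(load_in_8bit=True, llm_int8_threshold=6.0)

model = AutoModelForCausalLM.from_pretrained(
    model_id,
    quantization_config=bnb_config,
    device_map="auto",
)

# A 7B model is roughly 7-8 GB in 8-bit versus ~14 GB in fp16.
print(f"footprint: {model.get_memory_footprint() / 1e9:.1f} GB")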
 
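Relatedly, the new generate_answer builds a plain-text prompt, while Mistral-7B-Instruct is trained on the [INST] ... [/INST] chat format. A hedged sketch of a possible follow-up (not in this commit) that routes the same RAG prompt through the tokenizer's chat template, assuming a transformers version that supports apply_chat_template:

# Sketch: format the RAG prompt with the tokenizer's built-in chat
# template so it matches the [INST] ... [/INST] format the model expects.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")

context = "..."   # placeholder: retrieved chunks joined with newlines
question = "..."  # placeholder: the user's question
messages = [{
    "role": "user",
    "content": f"Use the context below to answer the question clearly.\n\n"
               f"Context:\n{context}\n\nQuestion: {question}",
}]

# tokenize=False returns the formatted string, ready for the pipeline;
# add_generation_prompt leaves the turn open for the model's answer.
prompt = tokenizer.apply_chat_template(
    messages, tokenize=False, add_generation_prompt=True
)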
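Finally, process_file ranks chunks with IndexFlatL2, while BGE embeddings are normally L2-normalized and compared by inner product (cosine similarity). A small self-contained sketch of that variant, with hypothetical sample texts standing in for a real document:

# Sketch: cosine-similarity retrieval with FAISS, an alternative to the
# IndexFlatL2 ranking in the diff above. Names mirror the app's globals.
import faiss
from sentence_transformers import SentenceTransformer

embed_model = SentenceTransformer("BAAI/bge-base-en-v1.5")
doc_texts = ["FAISS does similarity search.", "Mistral 7B generates the answer."]

embeddings = embed_model.encode(doc_texts, convert_to_numpy=True)
faiss.normalize_L2(embeddings)                  # normalize in place
index = faiss.IndexFlatIP(embeddings.shape[1])  # inner product == cosine once normalized
index.add(embeddings)

query = embed_model.encode(["What does FAISS do?"], convert_to_numpy=True)
faiss.normalize_L2(query)
scores, ids = index.search(query, k=1)          # highest cosine score first
print(doc_texts[ids[0][0]], float(scores[0][0]))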