Spaces:

Shahbazakbar
/

TestGPT2ChatBot

Sleeping

App Files Files Community

Shahbazakbar committed on Feb 22, 2025

Commit

fb75b56

verified ·

1 Parent(s): 65f18a8

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -13

app.py CHANGED Viewed

@@ -5,14 +5,23 @@ import gradio as gr
 import fitz  # PyMuPDF
 import easyocr
 from PIL import Image
# DistilGPT-2 checkpoint: weights and tokenizer are both loaded from "distilgpt2".
distilgpt2_model = AutoModelForCausalLM.from_pretrained("distilgpt2")
distilgpt2_tokenizer = AutoTokenizer.from_pretrained("distilgpt2")
# Run on the GPU whenever CUDA is usable; otherwise keep the model as loaded.
distilgpt2_model = (
    distilgpt2_model.to("cuda") if torch.cuda.is_available() else distilgpt2_model
)
 # Function to extract text from PDF
 def extract_text_from_pdf(pdf_path):
@@ -31,31 +40,66 @@ def extract_text_from_image(image_path):
 # Function to generate a response
 def generate_response(prompt):
-    inputs = distilgpt2_tokenizer(prompt, return_tensors="pt").to(distilgpt2_model.device)
-    outputs = distilgpt2_model.generate(**inputs, max_length=100)
-    response = distilgpt2_tokenizer.decode(outputs[0], skip_special_tokens=True)
     return response
 # Chatbot function to handle text, PDF, and image inputs
 def chatbot(input_type, text_input, pdf_input, image_input):
     if input_type == "Text":
         if not text_input:
             return "Please enter some text."
-        prompt = text_input
     elif input_type == "PDF":
         if pdf_input is None:
             return "Please upload a PDF file."
         pdf_text = extract_text_from_pdf(pdf_input)
-        prompt = f"Extracted text from PDF:\n{pdf_text}\n\nQuestion: {text_input}"
     elif input_type == "Image":
         if image_input is None:
             return "Please upload an image file."
         image_text = extract_text_from_image(image_input)
-        prompt = f"Extracted text from image:\n{image_text}\n\nQuestion: {text_input}"
     else:
         return "Invalid input type."
     # Generate response using the model
     response = generate_response(prompt)
     return response
@@ -72,7 +116,7 @@ interface = gr.Interface(
     fn=chatbot,
     inputs=input_components,
     outputs="text",
-    title="Lightweight Chatbot with PDF and Image Support",
     description="Select the input type (Text, PDF, or Image) and provide your input."
 )

 import fitz  # PyMuPDF
 import easyocr
 from PIL import Image
+from sentence_transformers import SentenceTransformer
+from chromadb import Client, Settings
# Load Zephyr 7B (fine-tuned for chat)
zephyr_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-alpha")
zephyr_model = AutoModelForCausalLM.from_pretrained(
    "HuggingFaceH4/zephyr-7b-alpha",
    # Half precision only pays off on a GPU; fall back to float32 on CPU-only
    # hosts, where float16 kernels may be missing or very slow.
    torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
    device_map="auto",  # Let the loader decide where to place the weights
)
# Load a sentence transformer model for embeddings
embedding_model = SentenceTransformer("all-MiniLM-L6-v2")
# Initialize Chroma client for RAG
chroma_client = Client(Settings())
# get_or_create_collection is idempotent: re-running this module against a
# client that already holds "knowledge_base" reuses it instead of raising.
collection = chroma_client.get_or_create_collection(name="knowledge_base")
 # Function to extract text from PDF
 def extract_text_from_pdf(pdf_path):
 # Function to generate a response
 def generate_response(prompt):
+    # Structure the input prompt for chat
+    formatted_prompt = f"<|user|>\n{prompt}\n<|assistant|>\n"
+    # Tokenize the input prompt
+    inputs = zephyr_tokenizer(formatted_prompt, return_tensors="pt").to(zephyr_model.device)
+    # Generate the response
+    outputs = zephyr_model.generate(**inputs, max_length=200)
+    # Decode the response
+    response = zephyr_tokenizer.decode(outputs[0], skip_special_tokens=True)
+    # Extract only the assistant's response
+    response = response.split("<|assistant|>")[-1].strip()
     return response
# Function to add documents to the knowledge base
def add_to_knowledge_base(text_chunks):
    """Embed ``text_chunks`` and store them in the Chroma collection.

    Args:
        text_chunks: Iterable of strings to index. Empty or whitespace-only
            chunks are skipped.

    Returns:
        None. Nothing is written when there is no non-empty chunk.
    """
    import uuid  # local import: the file's import header is not fully visible here

    chunks = [chunk for chunk in text_chunks if chunk and chunk.strip()]
    if not chunks:
        return None

    embeddings = embedding_model.encode(chunks)
    # One batched add instead of one call per chunk. Random ids keep a later
    # call from colliding with records stored earlier; positional ids
    # ("0", "1", ...) restarted from zero on every call.
    collection.add(
        documents=chunks,
        embeddings=[embedding.tolist() for embedding in embeddings],
        ids=[uuid.uuid4().hex for _ in chunks],
    )
    return None
# Function to retrieve relevant chunks
def retrieve_relevant_chunks(query, top_k=3):
    """Return the stored chunks most similar to ``query``.

    Args:
        query: Text to search the knowledge base with.
        top_k: Maximum number of chunks to return.

    Returns:
        A list of at most ``top_k`` document strings; empty when the query is
        empty, ``top_k`` is not positive, or the collection holds nothing.
    """
    if not query or top_k <= 0:
        return []

    # Never ask for more neighbours than the collection holds, and skip the
    # query entirely when there is nothing to search.
    stored = collection.count()
    if stored == 0:
        return []

    query_embedding = embedding_model.encode(query)
    results = collection.query(
        query_embeddings=[query_embedding.tolist()],
        n_results=min(top_k, stored),
    )
    # Results are grouped per query embedding; only one was sent.
    return results["documents"][0]
 # Chatbot function to handle text, PDF, and image inputs
 def chatbot(input_type, text_input, pdf_input, image_input):
     if input_type == "Text":
         if not text_input:
             return "Please enter some text."
+        query = text_input
     elif input_type == "PDF":
         if pdf_input is None:
             return "Please upload a PDF file."
         pdf_text = extract_text_from_pdf(pdf_input)
+        query = f"Extracted text from PDF:\n{pdf_text}\n\nQuestion: {text_input}"
     elif input_type == "Image":
         if image_input is None:
             return "Please upload an image file."
         image_text = extract_text_from_image(image_input)
+        query = f"Extracted text from image:\n{image_text}\n\nQuestion: {text_input}"
     else:
         return "Invalid input type."
+    # Retrieve relevant chunks from the knowledge base
+    relevant_chunks = retrieve_relevant_chunks(query)
+    context = "\n\n".join(relevant_chunks)
     # Generate response using the model
+    prompt = f"Context:\n{context}\n\nQuestion: {query}\n\nAnswer:"
     response = generate_response(prompt)
     return response
     fn=chatbot,
     inputs=input_components,
     outputs="text",
+    title="RAG Chatbot with PDF and Image Support",
     description="Select the input type (Text, PDF, or Image) and provide your input."
 )