Spaces:

KushwanthK
/

vedic_scriptures

Sleeping

KushwanthK committed on May 19, 2024

Commit

f0b5e94

verified ·

1 Parent(s): f98ad5c

Upload 2 files

Files changed (2) hide show

app.py CHANGED Viewed

@@ -422,6 +422,8 @@ import nltk
 nltk.download('stopwords')
 from nltk.corpus import stopwords
 from collections import Counter
 def highlight_pdf(file_path, text_to_highlight, page_numbers):
     # Create a temporary file to save the modified PDF
@@ -484,6 +486,19 @@ def highlight_pdf(file_path, text_to_highlight, page_numbers):
 # Example usage
 # Function to display PDF in Streamlit
 def display_highlighted_pdf():
     pdf_path = "Bhagavad-Gita-As-It-Is.pdf"
@@ -494,12 +509,15 @@ def display_highlighted_pdf():
     print(highlighted_pdf_path)
-    with open(highlighted_pdf_path, "rb") as file:
-            pdf_bytes = file.read()
-        # Use pdf_viewer to display the PDF in Streamlit
-    pdf_viewer(pdf_bytes, width=700)
 display_highlighted_pdf()

 nltk.download('stopwords')
 from nltk.corpus import stopwords
 from collections import Counter
+from streamlit_image_zoom import image_zoom
+from PIL import Image
 def highlight_pdf(file_path, text_to_highlight, page_numbers):
     # Create a temporary file to save the modified PDF
 # Example usage
+def pdf_to_images(pdf_path, page_numbers):  # Render the given pages of the PDF at pdf_path; returns a list of PNG-encoded bytes, one per page.
+    doc = fitz.open(pdf_path)  # NOTE(review): the document is never closed inside this function
+    images = []
+    for page_number in page_numbers:
+        page = doc.load_page(page_number - 1)  # presumably page_numbers are 1-based, hence the -1 — verify against caller
+        pix = page.get_pixmap()
+        img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)  # NOTE(review): assumes a 3-channel RGB pixmap without alpha — confirm
+        buf = io.BytesIO()  # NOTE(review): no `import io` is visible in this diff — confirm it exists elsewhere in app.py
+        img.save(buf, format="PNG")  # encode the rendered page as PNG into the in-memory buffer
+        byte_im = buf.getvalue()
+        images.append(byte_im)
+    return images
 # Function to display PDF in Streamlit
 def display_highlighted_pdf():
     pdf_path = "Bhagavad-Gita-As-It-Is.pdf"
     print(highlighted_pdf_path)
+    # with open(highlighted_pdf_path, "rb") as file:
+    #     pdf_bytes = file.read()
+    #     # Use pdf_viewer to display the PDF in Streamlit
+    # pdf_viewer(pdf_bytes, width=700)
+    images = pdf_to_images(highlighted_pdf_path, sources)
+    for img in images:
+        image_zoom(img)
 display_highlighted_pdf()

requirements.txt CHANGED Viewed

@@ -1,22 +1,15 @@
-# pinecone-client[grpc]
-sentence-transformers==2.2.2
 datasets
 torch
 streamlit-chat-media
 streamlit-chat
-transformers==4.28.0
 PyPDF2
 ratelimit
 backoff
 tqdm
 openai
 PyMuPDF  # instead of fitz
-nltk
-langchain_community
-langchain
-# faiss-gpu
-faiss-cpu==1.7.2
-stqdm
-python-dotenv
-# langchain-huggingface
-streamlit_pdf_viewer

+sentence-transformers
 datasets
 torch
 streamlit-chat-media
 streamlit-chat
+transformers
 PyPDF2
 ratelimit
 backoff
 tqdm
 openai
 PyMuPDF  # instead of fitz
+reportlab
+PyPDF2Highlight
+streamlit-image-zoom