VoiceGPT15

Sleeping

awacke1 committed on Jul 7, 2023

Commit

03d5e6b

•

1 Parent(s): bf4227b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -203,7 +203,9 @@ def extract_mime_type(file):
     else:
         raise TypeError("Input should be a string or a streamlit.UploadedFile object")
-from io import BytesIO
 def extract_file_extension(file):
     # get the file name directly from the UploadedFile object
@@ -229,8 +231,12 @@ def pdf2txt(docs):
         # read the file according to its extension
         try:
-            if file_extension.lower() in ['txt', 'html', 'htm', 'py', 'xml', 'json', 'docx']:
-                text += textract.process(temp_file_name).decode("utf-8")
             elif file_extension.lower() == 'pdf':
                 with open(temp_file_name, "rb") as f:
                     pdf = PdfFileReader(f)
@@ -245,6 +251,7 @@ def pdf2txt(docs):
     return text
 def pdf2txt_old(pdf_docs):
     st.write(pdf_docs)
     for file in pdf_docs:

     else:
         raise TypeError("Input should be a string or a streamlit.UploadedFile object")
+from PyPDF2 import PdfFileReader
+import os
+import re
 def extract_file_extension(file):
     # get the file name directly from the UploadedFile object
         # read the file according to its extension
         try:
+            if file_extension.lower() == 'py':
+                with open(temp_file_name, 'r') as f:
+                    text += f.read()
+            elif file_extension.lower() in ['txt', 'html', 'htm', 'xml', 'json']:
+                with open(temp_file_name, 'r') as f:
+                    text += f.read()
             elif file_extension.lower() == 'pdf':
                 with open(temp_file_name, "rb") as f:
                     pdf = PdfFileReader(f)
     return text
 def pdf2txt_old(pdf_docs):
     st.write(pdf_docs)
     for file in pdf_docs: