Spaces:

ammaan
/

youtubevideosummary

Sleeping

ammaan committed on May 13

Commit

47408f6

•

1 Parent(s): a4348b8

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -12,7 +12,7 @@ app = FastAPI()
 text_summary = pipeline("summarization", model="Falconsai/text_summarization")
-def extract_video_id(url) :
     regex = r"(?:youtube\.com\/(?:[^\/\n\s]+\/\S+\/|(?:v|e(?:mbed)?)\/|\S*?[?&]v=)|youtu\.be\/)([a-zA-Z0-9_-]{11})"
     match = re.search(regex, url)
     if match:
@@ -31,20 +31,6 @@ def get_youtube_transcript(video_url):
     except Exception as e:
         return f"An error occurred: {e}"
-def preprocess_text(text):
-    # Split the text into sentences
-    sentences = re.split(r'(?<=[.!?]) +', text)
-    return sentences
-def summarize_text(text):
-    try:
-        # Preprocess the text
-        sentences = preprocess_text(str(text))
-        # Summarize the text
-        summarized_text = text_summary(sentences)
-        return summarized_text[0]['summary_text']
-    except Exception as e:
-        return f"An error occurred: {e}"
 # Get the input from the frontend
 @app.get("/getdata")
@@ -52,8 +38,8 @@ def get_data(input):
     print(input)
     transcript = get_youtube_transcript(input)
     if transcript:
-        summary = summarize_text(transcript)
-        return {"summary": summary}
     else:
         return {"error": "Failed to get transcript from the YouTube video."}

 text_summary = pipeline("summarization", model="Falconsai/text_summarization")
+def extract_video_id(url):
     regex = r"(?:youtube\.com\/(?:[^\/\n\s]+\/\S+\/|(?:v|e(?:mbed)?)\/|\S*?[?&]v=)|youtu\.be\/)([a-zA-Z0-9_-]{11})"
     match = re.search(regex, url)
     if match:
     except Exception as e:
         return f"An error occurred: {e}"
 # Get the input from the frontend
 @app.get("/getdata")
     print(input)
     transcript = get_youtube_transcript(input)
     if transcript:
+        summary = text_summary(transcript,min_length=10,max_length=1000,do_sample=False)
+        return {"summary": summary[0]['summary_text']}
     else:
         return {"error": "Failed to get transcript from the YouTube video."}