Spaces:

wldmr
/

tubifier

Sleeping

wldmr committed on Nov 14, 2022

Commit

ee90b6b

•

1 Parent(s): c05de66

app file

Files changed (3) hide show

app.py CHANGED Viewed

@@ -37,7 +37,7 @@ def image_mod(link):
     json_file = su.getSummary(link, lexrank_switch, rpunkt_switch)
     #html, images = su.getSummary(link, lexrank_switch, rpunkt_switch)
     #images = su.getSummaryImage(link, lexrank_switch, rpunkt_switch)
-    print(html)
     files = os.listdir('workdir/')
     print('local files: ',files)
@@ -51,7 +51,7 @@ def image_mod(link):
     #images[0].save("newlion.png")
-    print('images',images)
     #return {"html": html, "images":images}
     #return HTMLResponse(content=html)

     json_file = su.getSummary(link, lexrank_switch, rpunkt_switch)
     #html, images = su.getSummary(link, lexrank_switch, rpunkt_switch)
     #images = su.getSummaryImage(link, lexrank_switch, rpunkt_switch)
+    #print(html)
     files = os.listdir('workdir/')
     print('local files: ',files)
     #images[0].save("newlion.png")
+    #print('images',images)
     #return {"html": html, "images":images}
     #return HTMLResponse(content=html)

summarizer.py CHANGED Viewed

@@ -79,7 +79,8 @@ def getSummary(link, lexrank_switch, rpunkt_switch):
         return 'Error: no link provided'
     print('getting transcript using link: ', link)
-    raw_transcript, type_transcript = ts.get_json_transcript(link,rpunkt_switch)
     print('transcript type: ', type_transcript)
     #timestamps = ts.get_timestamps(raw_transcript)
     raw_caption = ts.get_caption(raw_transcript)

         return 'Error: no link provided'
     print('getting transcript using link: ', link)
+    video_id = get_id_from_link(link)
+    raw_transcript, type_transcript = ts.get_json_transcript(video_id,rpunkt_switch)
     print('transcript type: ', type_transcript)
     #timestamps = ts.get_timestamps(raw_transcript)
     raw_caption = ts.get_caption(raw_transcript)

transcript.py CHANGED Viewed

@@ -7,13 +7,19 @@ import base64
 #transcript_list = YouTubeTranscriptApi.list_transcripts('ReHGSGwV4-A')
 #transcript = transcript_list.find_transcript(['en','de'])
-# step 1: download the json transcript for youtube video
-def get_json_transcript(link,rpunkt_switch):
     if "v=" in link:
         video_id = link.split("v=")[1].split("&")[0]
     else:
         return "Error: Invalid Link, it does not have the pattern 'v=' in it."
     transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
     # get the auto-generated english text

 #transcript_list = YouTubeTranscriptApi.list_transcripts('ReHGSGwV4-A')
 #transcript = transcript_list.find_transcript(['en','de'])
+def get_id_from_link(link):
+    video_id = ""
     if "v=" in link:
         video_id = link.split("v=")[1].split("&")[0]
+    elif len(link)==11:
     else:
         return "Error: Invalid Link, it does not have the pattern 'v=' in it."
+    return video_id
+# step 1: download the json transcript for youtube video
+def get_json_transcript(video_id,rpunkt_switch):
     transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
     # get the auto-generated english text