Spaces:

minnehwg
/

youtube-summarizer

Running

minnehwg committed on Jun 3

Commit

9a1b6f5

•

1 Parent(s): 16e7c81

Update util.py

Files changed (1) hide show

util.py CHANGED Viewed

@@ -46,8 +46,8 @@ def get_subtitles(video_url):
 from youtube_transcript_api import YouTubeTranscriptApi
-def restore_punctuation(text):
-    model = PunctuationModel()
     result = model.restore_punctuation(text)
     return result
@@ -124,19 +124,3 @@ def display(text):
     return formatted_sentences
-def pipeline(url, model, tokenizer):
-    trans, sub = get_subtitles(url)
-    sub = restore_punctuation(sub)
-    vie_sub = translate_long(sub)
-    vie_sub = processed(vie_sub)
-    chunks = split_into_chunks(vie_sub, 700, 2)
-    sum_para = []
-    for i in chunks:
-        tmp = summarize(i, model, tokenizer, num_beams=3)
-        sum_para.append(tmp)
-    suma = ''.join(sum_para)
-    del sub, vie_sub, sum_para, chunks
-    suma = post_processing(suma)
-    re = display(suma)
-    return re

 from youtube_transcript_api import YouTubeTranscriptApi
+def restore_punctuation(text, model_restore):
+    model = model_restore
     result = model.restore_punctuation(text)
     return result
     return formatted_sentences