Spaces:

storresbusquets
/

llm-demo1

Runtime error

App Files Files Community

storresbusquets committed on Sep 19, 2023

Commit

549e47a

•

1 Parent(s): b8e3183

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -23

app.py CHANGED Viewed

@@ -307,8 +307,7 @@ class GradioInference:
     def from_article(self, article, progress=gr.Progress()):
         """
         Call the Gradio Inference python class.
-        Uses it directly the Whisper model to perform Automatic Speech Recognition (i.e Speech-to-Text).
-        Once the function has the transcription of the video it proccess it to obtain:
             - Summary: using Facebook's BART transformer.
             - KeyWords: using VoiceLabT5 keyword extractor.
             - Sentiment Analysis: using Hugging Face's default sentiment classifier
@@ -320,14 +319,14 @@ class GradioInference:
         # Perform summarization on the transcription
         transcription_summary = self.bart_summarizer(
-            results["text"], max_length=150, min_length=30, do_sample=False, truncation=True
         )
         #### Resumen multilingue
         WHITESPACE_HANDLER = lambda k: re.sub('\s+', ' ', re.sub('\n+', ' ', k.strip()))
         input_ids_sum = self.mt5_tokenizer(
-            [WHITESPACE_HANDLER(results["text"])],
             return_tensors="pt",
             padding="max_length",
             truncation=True,
@@ -352,7 +351,7 @@ class GradioInference:
         # Extract keywords using VoiceLabT5
         task_prefix = "Keywords: "
-        input_sequence = task_prefix + results["text"]
         input_ids = self.keyword_tokenizer(
             input_sequence,
@@ -387,26 +386,16 @@ class GradioInference:
         progress(0.90, desc="Generating Wordcloud")
         # WordCloud object
         wordcloud = WordCloud(colormap = "Oranges").generate(
-            results["text"]
         )
         wordcloud_image = wordcloud.to_image()
-        if lang == "english" or lang == "none":
-            return (
-                results["text"],
-                transcription_summary[0]["summary_text"],
-                formatted_keywords,
-                formatted_sentiment,
-                wordcloud_image,
-            )
-        else:
-            return (
-                results["text"],
-                summary,
-                formatted_keywords,
-                formatted_sentiment,
-                wordcloud_image,
-            )
 gio = GradioInference()
@@ -428,7 +417,7 @@ with block as demo:
         </div>
         """
     )
-    with gr.Group(spacing_size="md", radius_size="md"):
         with gr.Tab("From YouTube 📹"):
             with gr.Box():

     def from_article(self, article, progress=gr.Progress()):
         """
         Call the Gradio Inference python class.
+        Accepts the user's text input, then performs:
             - Summary: using Facebook's BART transformer.
             - KeyWords: using VoiceLabT5 keyword extractor.
             - Sentiment Analysis: using Hugging Face's default sentiment classifier
         # Perform summarization on the transcription
         transcription_summary = self.bart_summarizer(
+            article, max_length=150, min_length=30, do_sample=False, truncation=True
         )
         #### Resumen multilingue
         WHITESPACE_HANDLER = lambda k: re.sub('\s+', ' ', re.sub('\n+', ' ', k.strip()))
         input_ids_sum = self.mt5_tokenizer(
+            [WHITESPACE_HANDLER(article)],
             return_tensors="pt",
             padding="max_length",
             truncation=True,
         # Extract keywords using VoiceLabT5
         task_prefix = "Keywords: "
+        input_sequence = task_prefix + article
         input_ids = self.keyword_tokenizer(
             input_sequence,
         progress(0.90, desc="Generating Wordcloud")
         # WordCloud object
         wordcloud = WordCloud(colormap = "Oranges").generate(
+            article
         )
         wordcloud_image = wordcloud.to_image()
+        return (
+            transcription_summary[0]["summary_text"],
+            formatted_keywords,
+            formatted_sentiment,
+            wordcloud_image,
+        )
 gio = GradioInference()
         </div>
         """
     )
+    with gr.Group():
         with gr.Tab("From YouTube 📹"):
             with gr.Box():