Spaces:

open-nlp
/

Chris-lab

Sleeping

App Files Community

etchen committed on Jul 23, 2024

Commit

43d8095

1 Parent(s): 679d21e

dataset poc

Browse files

Files changed (3) hide show

pages/summarization_example.py +8 -1
requirements.txt +2 -1
utils/data.py +4 -0

pages/summarization_example.py CHANGED Viewed

@@ -1,12 +1,15 @@
 from dotenv import load_dotenv
 import gradio as gr
 from utils.model import Model
 __default_model_name__ = "lmsys/vicuna-7b-v1.5"
 model = Model(__default_model_name__)
 load_dotenv()
 examples = {
     "example 1": """Boston's injury reporting for Kristaps Porziņģis has been fairly coy. He missed Game 3, but his coach told reporters just before Game 4 that was technically available, but with a catch.
 Joe Mazzulla said Porziņģis would "only be used in specific instances, if necessary." That sounds like the team doesn't want to risk further injury to his dislocated Posterior Tibialis (or some other body part, due to overcompensation for the ankle), unless it's in a desperate situation.
@@ -20,6 +23,8 @@ Expect the rookie's playing time to continue to climb in Game 5. It seems increa
 Lively has been absolutely relentless on the offensive glass all postseason. He makes solid decisions as a passer when his rolls don't immediately lead to dunks. And he's not a liability when caught defending guards or wings outside.
 All of that has led to postseason averages of 8.2 points, 7.6 rebounds, 1.4 assists and 1.0 blocks in just 21.9 minutes, as well as a double-double in 22 minutes of Game 4.
 Back in Boston, Kidd is going to rely on Lively even more. He'll play close to 30 minutes and reach double-figures in both scoring and rebounding again.""",
 }
 def generate_answer(sources, model_name, prompt):
@@ -39,6 +44,8 @@ def process_input(input_text, model_selection, prompt):
         return "Please fill the input to generate outputs."
 def update_input(example):
     return examples[example]
 def create_summarization_interface():
@@ -64,4 +71,4 @@ summarization: """, label='Input Prompting Template', lines=8, placeholder='Inpu
 if __name__ == "__main__":
     demo = create_summarization_interface()
-    demo.launch()

 from dotenv import load_dotenv
 import gradio as gr
+import random
 from utils.model import Model
+from utils.data import dataset
 __default_model_name__ = "lmsys/vicuna-7b-v1.5"
 model = Model(__default_model_name__)
 load_dotenv()
+random_label = '🔀 Random dialogue from dataset'
 examples = {
     "example 1": """Boston's injury reporting for Kristaps Porziņģis has been fairly coy. He missed Game 3, but his coach told reporters just before Game 4 that was technically available, but with a catch.
 Joe Mazzulla said Porziņģis would "only be used in specific instances, if necessary." That sounds like the team doesn't want to risk further injury to his dislocated Posterior Tibialis (or some other body part, due to overcompensation for the ankle), unless it's in a desperate situation.
 Lively has been absolutely relentless on the offensive glass all postseason. He makes solid decisions as a passer when his rolls don't immediately lead to dunks. And he's not a liability when caught defending guards or wings outside.
 All of that has led to postseason averages of 8.2 points, 7.6 rebounds, 1.4 assists and 1.0 blocks in just 21.9 minutes, as well as a double-double in 22 minutes of Game 4.
 Back in Boston, Kidd is going to rely on Lively even more. He'll play close to 30 minutes and reach double-figures in both scoring and rebounding again.""",
+    random_label: ""
 }
 def generate_answer(sources, model_name, prompt):
         return "Please fill the input to generate outputs."
 def update_input(example):
+    if example == random_label:
+        return random.choice(dataset)['dialogue']
     return examples[example]
 def create_summarization_interface():
 if __name__ == "__main__":
     demo = create_summarization_interface()
+    demo.launch()

requirements.txt CHANGED Viewed

@@ -6,4 +6,5 @@ sentencepiece
 gradio
 torch
 torchvision
-torchaudio

 gradio
 torch
 torchvision
+torchaudio
+datasets

utils/data.py ADDED Viewed

@@ -0,0 +1,4 @@

+from datasets import load_dataset
+dialogsum = load_dataset('knkarthick/dialogsum')
+dataset = list(dialogsum['train']) + list(dialogsum['validation']) + list(dialogsum['test'])