juanpablo4l committed on
Commit
d0fad25
1 Parent(s): 857aac4

Added NLG models

Browse files
Files changed (2) hide show
  1. app.py +17 -3
  2. models.py +57 -12
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import gradio as gr
2
 
3
- from models import MODELS, PIPELINES
4
 
5
 
6
  def predict(text: str, model_name: str) -> str:
@@ -9,16 +9,30 @@ def predict(text: str, model_name: str) -> str:
9
 
10
  with gr.Blocks(title="CLARIN-PL Dialogue System Modules") as demo:
11
  gr.Markdown("Dialogue State Tracking Modules")
12
- for model_name in MODELS:
13
  with gr.Row():
14
  gr.Markdown(f"## {model_name}")
15
  model_name_component = gr.Textbox(value=model_name, visible=False)
16
  with gr.Row():
17
- text_input = gr.Textbox(label="Input Text", value=MODELS[model_name]["default_input"])
18
  output = gr.Textbox(label="Slot Value", value="")
19
  with gr.Row():
20
  predict_button = gr.Button("Predict")
21
  predict_button.click(fn=predict, inputs=[text_input, model_name_component], outputs=output)
22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  demo.queue(concurrency_count=3)
24
  demo.launch()
 
1
  import gradio as gr
2
 
3
+ from models import DST_MODELS, NLG_MODELS, PIPELINES
4
 
5
 
6
  def predict(text: str, model_name: str) -> str:
 
9
 
10
with gr.Blocks(title="CLARIN-PL Dialogue System Modules") as demo:

    def _model_section(model_name: str, default_input: str, output_label: str) -> None:
        """Render one model card: title, hidden model-name carrier, input/output
        textboxes and a Predict button wired to ``predict``.

        The hidden textbox smuggles the model name into ``predict`` as a regular
        Gradio input, so one callback serves every model.
        """
        with gr.Row():
            gr.Markdown(f"## {model_name}")
            model_name_component = gr.Textbox(value=model_name, visible=False)
        with gr.Row():
            text_input = gr.Textbox(label="Input Text", value=default_input)
            output = gr.Textbox(label=output_label, value="")
        with gr.Row():
            predict_button = gr.Button("Predict")
        predict_button.click(fn=predict, inputs=[text_input, model_name_component], outputs=output)

    gr.Markdown("Dialogue State Tracking Modules")
    for model_name in DST_MODELS:
        _model_section(model_name, DST_MODELS[model_name]["default_input"], "Slot Value")

    gr.Markdown("Natural Language Generation / Paraphrasing Modules")
    for model_name in NLG_MODELS:
        # BUG FIX: this section's output box was labelled "Slot Value" (copied from
        # the DST section); NLG models emit rewritten/paraphrased text, not slots.
        _model_section(model_name, NLG_MODELS[model_name]["default_input"], "Generated Text")

demo.queue(concurrency_count=3)
demo.launch()
models.py CHANGED
@@ -2,11 +2,12 @@ import os
2
  from typing import Any, Dict
3
 
4
  from transformers import (Pipeline, T5ForConditionalGeneration, T5Tokenizer,
5
- pipeline)
6
 
7
  auth_token = os.environ.get("CLARIN_KNEXT")
8
 
9
- DEFAULT_INPUTS: Dict[str, str] = {
 
10
  "polish": (
11
  "[U] Chciałbym zarezerwować stolik na 4 osoby na piątek o godzinie 18:30. "
12
  "[Dziedzina] Restauracje: Popularna usługa wyszukiwania i rezerwacji restauracji "
@@ -19,47 +20,91 @@ DEFAULT_INPUTS: Dict[str, str] = {
19
  ),
20
  }
21
 
22
- MODELS: Dict[str, Dict[str, Any]] = {
 
23
  "plt5-small": {
24
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/plt5-small-dst", use_auth_token=auth_token),
25
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/plt5-small-dst", use_auth_token=auth_token),
26
- "default_input": DEFAULT_INPUTS["polish"],
27
  },
28
  "plt5-base": {
29
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/plt5-base-dst", use_auth_token=auth_token),
30
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/plt5-base-dst", use_auth_token=auth_token),
31
- "default_input": DEFAULT_INPUTS["polish"],
32
  },
33
  "plt5-base-poquad-dst-v2": {
34
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/plt5-base-poquad-dst-v2", use_auth_token=auth_token),
35
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/plt5-base-poquad-dst-v2", use_auth_token=auth_token),
36
- "default_input": DEFAULT_INPUTS["polish"],
37
  },
38
  "t5-small": {
39
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/t5-small-dst", use_auth_token=auth_token),
40
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/t5-small-dst", use_auth_token=auth_token),
41
- "default_input": DEFAULT_INPUTS["english"],
42
  },
43
  "t5-base": {
44
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/t5-base-dst", use_auth_token=auth_token),
45
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/t5-base-dst", use_auth_token=auth_token),
46
- "default_input": DEFAULT_INPUTS["english"],
47
  },
48
  "flant5-small [EN/PL]": {
49
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/flant5-small-dst", use_auth_token=auth_token),
50
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/flant5-small-dst", use_auth_token=auth_token),
51
- "default_input": DEFAULT_INPUTS["english"],
52
  },
53
  "flant5-base [EN/PL]": {
54
  "model": T5ForConditionalGeneration.from_pretrained("clarin-knext/flant5-base-dst", use_auth_token=auth_token),
55
  "tokenizer": T5Tokenizer.from_pretrained("clarin-knext/flant5-base-dst", use_auth_token=auth_token),
56
- "default_input": DEFAULT_INPUTS["english"],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  },
58
  }
59
 
60
  PIPELINES: Dict[str, Pipeline] = {
61
  model_name: pipeline(
62
- "text2text-generation", model=MODELS[model_name]["model"], tokenizer=MODELS[model_name]["tokenizer"]
63
  )
64
- for model_name in MODELS
65
  }
 
2
  from typing import Any, Dict
3
 
4
  from transformers import (Pipeline, T5ForConditionalGeneration, T5Tokenizer,
5
+ pipeline, AutoModelForSeq2SeqLM, AutoModelForCausalLM, AutoTokenizer)
6
 
7
  auth_token = os.environ.get("CLARIN_KNEXT")
8
 
9
+
10
+ DEFAULT_DST_INPUTS: Dict[str, str] = {
11
  "polish": (
12
  "[U] Chciałbym zarezerwować stolik na 4 osoby na piątek o godzinie 18:30. "
13
  "[Dziedzina] Restauracje: Popularna usługa wyszukiwania i rezerwacji restauracji "
 
20
  ),
21
  }
22
 
23
+
24
def _dst_entry(repo: str, language: str) -> Dict[str, Any]:
    """Build one DST model entry from the Hub repo *repo*.

    Returns a dict with the loaded T5 model, its tokenizer, and the
    language-appropriate example input shown in the demo UI.
    """
    return {
        "model": T5ForConditionalGeneration.from_pretrained(repo, use_auth_token=auth_token),
        "tokenizer": T5Tokenizer.from_pretrained(repo, use_auth_token=auth_token),
        "default_input": DEFAULT_DST_INPUTS[language],
    }


# Dialogue State Tracking checkpoints; keys are the names shown in the UI.
DST_MODELS: Dict[str, Dict[str, Any]] = {
    "plt5-small": _dst_entry("clarin-knext/plt5-small-dst", "polish"),
    "plt5-base": _dst_entry("clarin-knext/plt5-base-dst", "polish"),
    "plt5-base-poquad-dst-v2": _dst_entry("clarin-knext/plt5-base-poquad-dst-v2", "polish"),
    "t5-small": _dst_entry("clarin-knext/t5-small-dst", "english"),
    "t5-base": _dst_entry("clarin-knext/t5-base-dst", "english"),
    "flant5-small [EN/PL]": _dst_entry("clarin-knext/flant5-small-dst", "english"),
    "flant5-base [EN/PL]": _dst_entry("clarin-knext/flant5-base-dst", "english"),
}
61
+
62
+
63
# Example inputs for the NLG / paraphrasing demos. The decoder-only (GPT-2 style)
# checkpoints expect the same text wrapped in [BOS]...[SEP] prompt markers.
DEFAULT_ENCODER_DECODER_INPUT_EN = "The alarm is set for 6 am. The alarm's name is name \"Get up\"."
DEFAULT_DECODER_ONLY_INPUT_EN = f"[BOS]{DEFAULT_ENCODER_DECODER_INPUT_EN}[SEP]"
DEFAULT_ENCODER_DECODER_INPUT_PL = "Alarm jest o godzinie 6 rano. Alarm ma nazwę \"Obudź się\"."
DEFAULT_DECODER_ONLY_INPUT_PL = f"[BOS]{DEFAULT_ENCODER_DECODER_INPUT_PL}[SEP]"


def _nlg_entry(repo: str, default_input: str, *, causal: bool = False) -> Dict[str, Any]:
    """Build one NLG model entry from the Hub repo *repo*.

    *causal* selects the decoder-only loader (GPT-2 style checkpoints);
    otherwise an encoder-decoder (seq2seq) loader is used.
    """
    loader = AutoModelForCausalLM if causal else AutoModelForSeq2SeqLM
    return {
        "model": loader.from_pretrained(repo, use_auth_token=auth_token),
        "tokenizer": AutoTokenizer.from_pretrained(repo, use_auth_token=auth_token),
        "default_input": default_input,
    }


# Utterance-rewriting / paraphrasing checkpoints; keys are the names shown in the UI.
NLG_MODELS: Dict[str, Dict[str, Any]] = {
    # English
    "t5-large": _nlg_entry("clarin-knext/utterance-rewriting-t5-large", DEFAULT_ENCODER_DECODER_INPUT_EN),
    "en-mt5-large": _nlg_entry("clarin-knext/utterance-rewriting-en-mt5-large", DEFAULT_ENCODER_DECODER_INPUT_EN),
    "gpt2": _nlg_entry("clarin-knext/utterance-rewriting-gpt2", DEFAULT_DECODER_ONLY_INPUT_EN, causal=True),
    # Polish
    "pt5-large": _nlg_entry("clarin-knext/utterance-rewriting-pt5-large", DEFAULT_ENCODER_DECODER_INPUT_PL),
    "pl-mt5-large": _nlg_entry("clarin-knext/utterance-rewriting-pl-mt5-large", DEFAULT_ENCODER_DECODER_INPUT_PL),
    "polish-gpt2": _nlg_entry("clarin-knext/utterance-rewriting-polish-gpt2", DEFAULT_DECODER_ONLY_INPUT_PL, causal=True),
}
104
 
105
# One ready-to-call pipeline per UI model name.
# BUG FIX: this commit added NLG_MODELS but still built pipelines only for
# DST_MODELS, so selecting any NLG model raised KeyError at predict time.
# Also, the task was hard-coded to "text2text-generation", which is wrong for
# the causal (GPT-2 style) checkpoints — choose the task from the model config.
PIPELINES: Dict[str, Pipeline] = {
    model_name: pipeline(
        "text2text-generation" if spec["model"].config.is_encoder_decoder else "text-generation",
        model=spec["model"],
        tokenizer=spec["tokenizer"],
    )
    for model_name, spec in {**DST_MODELS, **NLG_MODELS}.items()
}