Spaces:

pszemraj
/

ballpark-trivia

Runtime error

App Files Files Community

peter szemraj committed on Dec 31, 2021

Commit

2979040

•

1 Parent(s): 5b5e54c

reset model back to size L because XL breaks things

Browse files

Files changed (2) hide show

ai_single_response.py +18 -21
app.py +3 -0

ai_single_response.py CHANGED Viewed

@@ -16,6 +16,7 @@ import time
 import warnings
 from datetime import datetime
 from pathlib import Path
 from utils import print_spacer, cleantxt_wrap
 warnings.filterwarnings(action="ignore", message=".*gradient_checkpointing*")
@@ -118,27 +119,24 @@ def query_gpt_model(
     use_gpu=False,
 ):
     """
-    query_gpt_model [pass a prompt in to model, get a response. Does NOT "remember" past conversation]
-    Args:
-        folder_path ([type]): [description]
-        prompt_msg (str): [description]
-        speaker ([type], optional): [description]. Defaults to None.
-        responder (str, optional): [description]. Defaults to None.
-        resp_length (int, optional): [description]. Defaults to 128.
-        resp_min (int, optional): [description]. Defaults to 4.
-        kparam (int, optional): [description]. Defaults to 50.
-        temp (float, optional): [description]. Defaults to 0.75.
-        top_p (float, optional): [description]. Defaults to 0.65.
-        verbose (bool, optional): [description]. Defaults to False.
-        use_gpu (bool, optional): [description]. Defaults to False.
-    Returns:
-        [dict]: [returns a dict with A) just model response as str B) total conversation]
     """
     ai = aitextgen(
-        # model="pszemraj/Ballpark-Trivia-L", # THIS WORKS
-        model="pszemraj/Ballpark-Trivia-XL",
         to_gpu=use_gpu,
     )
@@ -187,8 +185,7 @@ def query_gpt_model(
     bot_resp = ", ".join(bot_dialogue)
     bot_resp = bot_resp.strip()
     # remove the last ',' '.' chars
-    bot_resp = bot_resp[:-1] if bot_resp.endswith(".") else bot_resp
-    bot_resp = bot_resp[:-1] if bot_resp.endswith(",") else bot_resp
     if verbose:
         print("\n... bot response:\n")
         pp.pprint(bot_resp)

 import warnings
 from datetime import datetime
 from pathlib import Path
+from grammar_improve import remove_trailing_punctuation
 from utils import print_spacer, cleantxt_wrap
 warnings.filterwarnings(action="ignore", message=".*gradient_checkpointing*")
     use_gpu=False,
 ):
     """
+    query_gpt_model - the main function that calls the model.
+    Parameters:
+    -----------
+    prompt_msg (str): the prompt to be sent to the model
+    speaker (str, optional): the name of the speaker. Defaults to None.
+    responder (str, optional): the name of the responder. Defaults to None.
+    resp_length (int, optional): the length of the response. Defaults to 128.
+    resp_min (int, optional): the minimum length of the response. Defaults to 4.
+    kparam (int, optional): the k value for top-k sampling (presumably; confirm against the generate call). Defaults to 150.
+    temp (float, optional): the sampling temperature. Defaults to 0.75.
+    top_p (float, optional): the top_p sampling parameter. Defaults to 0.65.
+    verbose (bool, optional): print debug output (e.g. the bot response). Defaults to False.
+    use_gpu (bool, optional): use gpu. Defaults to False.
     """
     ai = aitextgen(
+        model="pszemraj/Ballpark-Trivia-L", # THIS WORKS
+        # model="pszemraj/Ballpark-Trivia-XL", # does not seem to work
         to_gpu=use_gpu,
     )
     bot_resp = ", ".join(bot_dialogue)
     bot_resp = bot_resp.strip()
     # remove the last ',' '.' chars
+    bot_resp = remove_trailing_punctuation(bot_resp)
     if verbose:
         print("\n... bot response:\n")
         pp.pprint(bot_resp)

app.py CHANGED Viewed

@@ -153,6 +153,7 @@ if __name__ == "__main__":
         chat,
         inputs=["text"],
         outputs="html",
         title=f"Ballpark Trivia: {default_model} Model",
         description=f"Are you frequently asked google-able Trivia questions and annoyed by it? Well, this is the app for you! Ballpark Trivia Bot answers any trivia question with something that sounds plausible but is probably not 100% correct. \n\n One might say.. the answers are in the right ballpark.",
         article="Further details can be found in the [model card](https://huggingface.co/pszemraj/Ballpark-Trivia-L).  If you are interested in a more deceptively incorrect model, there is also [an XL version](https://huggingface.co/pszemraj/Ballpark-Trivia-XL) on my page.\n\n"
@@ -165,6 +166,7 @@ if __name__ == "__main__":
         .user_msg {background-color:cornflowerblue;color:white;align-self:start}
         .resp_msg {background-color:lightgray;align-self:self-end}
     """,
         allow_screenshot=True,
         allow_flagging=False,
         enable_queue=True,  # allows for dealing with multiple users simultaneously
@@ -175,4 +177,5 @@ if __name__ == "__main__":
     iface.launch(
         share=True,
         enable_queue=True,  # also allows for dealing with multiple users simultaneously (per newer gradio version)
     )

         chat,
         inputs=["text"],
         outputs="html",
+        examples=["when was Katy Perry born?"],
         title=f"Ballpark Trivia: {default_model} Model",
         description=f"Are you frequently asked google-able Trivia questions and annoyed by it? Well, this is the app for you! Ballpark Trivia Bot answers any trivia question with something that sounds plausible but is probably not 100% correct. \n\n One might say.. the answers are in the right ballpark.",
         article="Further details can be found in the [model card](https://huggingface.co/pszemraj/Ballpark-Trivia-L).  If you are interested in a more deceptively incorrect model, there is also [an XL version](https://huggingface.co/pszemraj/Ballpark-Trivia-XL) on my page.\n\n"
         .user_msg {background-color:cornflowerblue;color:white;align-self:start}
         .resp_msg {background-color:lightgray;align-self:self-end}
     """,
+        live=True,
         allow_screenshot=True,
         allow_flagging=False,
         enable_queue=True,  # allows for dealing with multiple users simultaneously
     iface.launch(
         share=True,
         enable_queue=True,  # also allows for dealing with multiple users simultaneously (per newer gradio version)
+        show_tips=True,
     )