pseudotensor committed · Commit b64f5c9 · 1 parent: edf6dca

Update with h2oGPT hash 69842ebb9decb32f33bd06c4e6e3bd9c5fb4a7ab

Files changed:
- gen.py +9 -7
- gpt_langchain.py +2 -1
- gradio_runner.py +5 -3
gen.py
CHANGED
@@ -403,13 +403,13 @@ def main(
 
     # auto-set langchain_mode
     if have_langchain and langchain_mode is None:
+        # start in chat mode, in case just want to chat and don't want to get "No documents to query" by default.
+        langchain_mode = LangChainMode.CHAT_LLM.value
         if allow_upload_to_user_data and not is_public and user_path:
-            langchain_mode = 'UserData'
-            print("Auto set langchain_mode=%s" % langchain_mode, flush=True)
+            print("Auto set langchain_mode=%s. Could use UserData instead." % langchain_mode, flush=True)
         elif allow_upload_to_my_data:
-            langchain_mode = 'MyData'
-            print("Auto set langchain_mode=%s."
-                  " To use UserData to pull files from disk,"
+            print("Auto set langchain_mode=%s. Could use MyData instead."
+                  " To allow UserData to pull files from disk,"
                   " set user_path and ensure allow_upload_to_user_data=True" % langchain_mode, flush=True)
         else:
             raise RuntimeError("Please pass --langchain_mode=<chosen mode> out of %s" % langchain_modes)
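For context, a minimal self-contained sketch of the new default-mode logic. The LangChainMode enum member values below are assumptions based on the names in this diff, not copied from h2oGPT's code:

from enum import Enum

# Assumed stand-in for h2oGPT's LangChainMode enum; member values are illustrative.
class LangChainMode(Enum):
    CHAT_LLM = "ChatLLM"    # plain chat, no document collection queried
    USER_DATA = "UserData"  # shared store fed from user_path on disk
    MY_DATA = "MyData"      # per-user store for ad-hoc uploads

have_langchain = True
langchain_mode = None
if have_langchain and langchain_mode is None:
    # start in chat mode so users don't hit "No documents to query" by default
    langchain_mode = LangChainMode.CHAT_LLM.value
print(langchain_mode)  # ChatLLM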
@@ -1555,7 +1555,8 @@ def evaluate(
         where_from = "openai_client"
 
         openai.api_key = os.getenv("OPENAI_API_KEY")
-        stop_sequences = list(set(prompter.terminate_response + [prompter.PreResponse]))
+        terminate_response = prompter.terminate_response or []
+        stop_sequences = list(set(terminate_response + [prompter.PreResponse]))
         stop_sequences = [x for x in stop_sequences if x]
         # OpenAI will complain if ask for too many new tokens, takes it as min in some sense, wrongly so.
         max_new_tokens_openai = min(max_new_tokens, model_max_length - num_prompt_tokens)
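The two added lines guard against prompter.terminate_response being None before deduplicating the stop list. A minimal sketch of the behavior, using a stand-in Prompter rather than h2oGPT's real class:

# Stand-in with only the two attributes the diff touches; h2oGPT's Prompter has more.
class Prompter:
    terminate_response = None  # None for prompt types with no terminator
    PreResponse = "<bot>:"

prompter = Prompter()

# Unguarded concatenation would raise TypeError when terminate_response is None.
terminate_response = prompter.terminate_response or []
stop_sequences = list(set(terminate_response + [prompter.PreResponse]))
stop_sequences = [x for x in stop_sequences if x]  # drop empty/None entries
print(stop_sequences)  # ['<bot>:']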
@@ -1764,7 +1765,8 @@ def evaluate(
 
             # prompt must include all human-bot like tokens, already added by prompt
             # https://github.com/huggingface/text-generation-inference/tree/main/clients/python#types
-            stop_sequences = list(set(prompter.terminate_response + [prompter.PreResponse]))
+            terminate_response = prompter.terminate_response or []
+            stop_sequences = list(set(terminate_response + [prompter.PreResponse]))
            stop_sequences = [x for x in stop_sequences if x]
            gen_server_kwargs = dict(do_sample=do_sample,
                                     max_new_tokens=max_new_tokens,
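The text-generation-inference Python client linked above accepts such stop sequences directly. A usage sketch; the server URL, prompt, and stop strings here are placeholders:

# Sketch: forwarding stop sequences to the TGI Python client.
# Placeholder server URL, prompt, and stop strings.
from text_generation import Client

stop_sequences = ["<human>:", "<bot>:"]
client = Client("http://127.0.0.1:8080")
response = client.generate("<human>: Hello\n<bot>:",
                           max_new_tokens=256,
                           stop_sequences=stop_sequences)
print(response.generated_text)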
gpt_langchain.py
CHANGED
@@ -643,7 +643,8 @@ def get_llm(use_openai_model=False,
 
        callbacks = [StreamingGradioCallbackHandler()]
        assert prompter is not None
-       stop_sequences = list(set(prompter.terminate_response + [prompter.PreResponse]))
+       terminate_response = prompter.terminate_response or []
+       stop_sequences = list(set(terminate_response + [prompter.PreResponse]))
        stop_sequences = [x for x in stop_sequences if x]
 
        if gr_client:
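In get_llm these stop sequences typically end up on a LangChain LLM wrapper. A sketch assuming LangChain's HuggingFaceTextGenInference wrapper, which exposes a stop_sequences field; whether get_llm constructs exactly this object is an assumption, and the URL is a placeholder:

# Assumption: a TGI-backed LangChain LLM; not necessarily what get_llm builds.
from langchain.llms import HuggingFaceTextGenInference

stop_sequences = ["<human>:", "<bot>:"]
llm = HuggingFaceTextGenInference(inference_server_url="http://127.0.0.1:8080",
                                  max_new_tokens=256,
                                  stop_sequences=stop_sequences)
print(llm("Hello"))  # generation halts at any stop sequence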
gradio_runner.py
CHANGED
@@ -434,6 +434,7 @@ def go_gradio(**kwargs):
                 value='All',
                 interactive=True,
                 multiselect=True,
+                visible=kwargs['langchain_mode'] != 'Disabled',
             )
             sources_visible = kwargs['langchain_mode'] != 'Disabled' and enable_sources_list
             with gr.Row():
@@ -454,10 +455,11 @@ def go_gradio(**kwargs):
                 with gr.Column(scale=2):
                     sources_text = gr.HTML(label='Sources Added', interactive=False)
 
-                doc_exception_text = gr.Textbox(value="",
-                                                interactive=False)
+                doc_exception_text = gr.Textbox(value="", label='Document Exceptions',
+                                                interactive=False,
+                                                visible=kwargs['langchain_mode'] != 'Disabled')
             with gr.TabItem("Document Viewer"):
-                with gr.Row():
+                with gr.Row(visible=kwargs['langchain_mode'] != 'Disabled'):
                     with gr.Column(scale=2):
                         get_viewable_sources_btn = gr.Button(value="Update UI with Document(s) from DB", scale=0,
                                                              size='sm',