Spaces:

routellm
/

demo

Runtime error

iojw committed on Jul 8

Commit

a3fd1d5

•

1 Parent(s): d51b0f1

Update mistral name

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,7 +45,11 @@ def predict(message, history, threshold, temperature):
     for i, chunk in enumerate(stream):
         print(chunk)
         if i == 0:
-            model_prefix = f"**[{chunk.model}]**\n"
             yield model_prefix
             partial_message += model_prefix
         partial_message += chunk.choices[0].delta.content or ""
@@ -62,6 +66,7 @@ demo = gr.ChatInterface(
         ),
     ],
     title="RouteLLM",
     description="This is a demo of our matrix factorization router, calibrated so that approximately 50% of calls (those that are harder) are routed to GPT-4, with remaining calls routed to Mixtral 8x7B.\n\nCheck out https://github.com/lm-sys/RouteLLM for details!",
 )

     for i, chunk in enumerate(stream):
         print(chunk)
         if i == 0:
+            if chunk.model == "mistralai/Mixtral-8x7B-Instruct-v0.1":
+                model_name = "Mixtral-8x7B-Instruct-v0.1"
+            else:
+                model_name = chunk.model
+            model_prefix = f"**[{model_name}]**\n"
             yield model_prefix
             partial_message += model_prefix
         partial_message += chunk.choices[0].delta.content or ""
         ),
     ],
     title="RouteLLM",
+    fill_height=True,
     description="This is a demo of our matrix factorization router, calibrated so that approximately 50% of calls (those that are harder) are routed to GPT-4, with remaining calls routed to Mixtral 8x7B.\n\nCheck out https://github.com/lm-sys/RouteLLM for details!",
 )