Spaces:
Runtime error
Runtime error
duplicate code because gradio is really wonky
Browse files
app.py
CHANGED
@@ -304,7 +304,7 @@ def open_user(message, nudge_msg, history):
|
|
304 |
return "", nudge_msg, history
|
305 |
|
306 |
|
307 |
-
def open_chat(model_name, history, system_msg, max_new_tokens, temperature, top_p, top_k, repetition_penalty
|
308 |
history = history or []
|
309 |
|
310 |
model = get_model_pipeline(model_name)
|
@@ -332,8 +332,32 @@ def open_chat(model_name, history, system_msg, max_new_tokens, temperature, top_
|
|
332 |
sleep(0.01)
|
333 |
|
334 |
|
335 |
-
def open_rp_chat(
|
336 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
337 |
|
338 |
|
339 |
with gr.Blocks() as arena:
|
|
|
304 |
return "", nudge_msg, history
|
305 |
|
306 |
|
307 |
+
def open_chat(model_name, history, system_msg, max_new_tokens, temperature, top_p, top_k, repetition_penalty):
|
308 |
history = history or []
|
309 |
|
310 |
model = get_model_pipeline(model_name)
|
|
|
332 |
sleep(0.01)
|
333 |
|
334 |
|
335 |
+
def open_rp_chat(model_name, history, system_msg, max_new_tokens, temperature, top_p, top_k, repetition_penalty):
    """Stream a reply from the roleplay variant of a model into the chat history.

    The pipeline is looked up via ``get_model_pipeline`` under the name
    ``f"{model_name}-roleplay"``. Its generation config is fetched and the
    sampling parameters passed in are written onto it before generating.

    Args:
        model_name: Base model name; ``"-roleplay"`` is appended for the lookup.
        history: Chat history; falsy values are replaced by an empty list.
            NOTE(review): the last entry is assumed to be a mutable
            ``[user_msg, partial_reply]`` pair whose reply slot is already a
            string -- an empty history would raise ``IndexError`` below;
            confirm the caller always appends the pending turn first.
        system_msg: System message handed to ``model.transform_prompt``.
        max_new_tokens: Stored under ``config["max_new_tokens"]``.
        temperature: Stored under ``config["temperature"]``.
        top_p: Stored under ``config["top_p"]``.
        top_k: Stored under ``config["top_k"]``.
        repetition_penalty: Stored under ``config["repetition_penalty"]``.

    Yields:
        ``(history, history, "")`` after each chunk is appended to the reply
        slot of the last history entry.
    """
    history = history or []

    model = get_model_pipeline(f"{model_name}-roleplay")
    config = model.get_generation_config()
    config["max_new_tokens"] = max_new_tokens
    config["temperature"] = temperature
    config["top_p"] = top_p
    config["top_k"] = top_k
    config["repetition_penalty"] = repetition_penalty

    messages = model.transform_prompt(system_msg, history)

    # remove last space from assistant, some models output a ZWSP if you leave a space
    messages = messages.rstrip()

    model_res = model(messages, config=config)  # type: Generator[List[Dict[str, str]], None, None]
    for res in model_res:
        # Split the generated text into chunks of one non-whitespace run plus
        # its surrounding whitespace, so the reply can be emitted piecewise.
        tokens = re.findall(r'\s*\S+\s*', res[0]['generated_text'])
        for token in tokens:
            history[-1][1] += token
            # stream the response
            yield history, history, ""
            # Short pause between chunks.
            sleep(0.01)
|
361 |
|
362 |
|
363 |
with gr.Blocks() as arena:
|