ljsabc committed on
Commit
fb89707
1 Parent(s): 03fcc17

Reserve answer space for long tokens; parameter test.

Browse files
Files changed (1) hide show
  1. app.py +8 -2
app.py CHANGED
@@ -84,10 +84,16 @@ def evaluate_stream(msg, history, temperature, top_p):
84
  context += history[-1][0]
85
  context = context.replace(r'<br>', '')
86
 
 
 
 
 
 
 
87
  h = []
88
  print("History:", history)
89
  print("Context:", context)
90
- for response, h in model.stream_chat(tokenizer, context, h, max_length=160, top_p=top_p, temperature=temperature):
91
  history[-1][1] = response
92
  yield history, ""
93
 
@@ -108,7 +114,7 @@ with gr.Blocks() as demo:
108
  with gr.Column(scale=2):
109
  temp = gr.components.Slider(minimum=0, maximum=1.1, value=0.95, label="Temperature",
110
  info="温度参数,越高的温度生成的内容越丰富,但是有可能出现语法问题。")
111
- top_p = gr.components.Slider(minimum=0.5, maximum=1.0, value=0.99, label="Top-p",
112
  info="top-p参数,只输出前p>top-p的文字,越大生成的内容越丰富,但也可能出现语法问题。数字越小似乎上下文的衔接性越好。")
113
  #code = gr.Textbox(label="temp_output", info="解码器输出")
114
  #top_k = gr.components.Slider(minimum=1, maximum=200, step=1, value=25, label="Top k",
 
84
  context += history[-1][0]
85
  context = context.replace(r'<br>', '')
86
 
87
+ # TODO: Avoid contexts whose token sequence is too long.
88
+ CUTOFF = 160
89
+ while tokenizer.encode(context) > CUTOFF:
90
+ # drop the oldest 15 characters each pass to leave room for the answer
91
+ context = context[15:]
92
+
93
  h = []
94
  print("History:", history)
95
  print("Context:", context)
96
+ for response, h in model.stream_chat(tokenizer, context, h, max_length=CUTOFF, top_p=top_p, temperature=temperature):
97
  history[-1][1] = response
98
  yield history, ""
99
 
 
114
  with gr.Column(scale=2):
115
  temp = gr.components.Slider(minimum=0, maximum=1.1, value=0.95, label="Temperature",
116
  info="温度参数,越高的温度生成的内容越丰富,但是有可能出现语法问题。")
117
+ top_p = gr.components.Slider(minimum=0.5, maximum=1.0, value=0.9, label="Top-p",
118
  info="top-p参数,只输出前p>top-p的文字,越大生成的内容越丰富,但也可能出现语法问题。数字越小似乎上下文的衔接性越好。")
119
  #code = gr.Textbox(label="temp_output", info="解码器输出")
120
  #top_k = gr.components.Slider(minimum=1, maximum=200, step=1, value=25, label="Top k",