Roger Condori committed on
Commit
fc80b18
1 Parent(s): 0ce15d3

add description restriction maxtokens app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -130,7 +130,7 @@ with gr.Blocks(theme=theme, css=css) as demo:
130
  gr.HTML("<h3>Only models from the GGML library are accepted.</h3>")
131
  repo_ = gr.Textbox(label="Repository" ,value="TheBloke/Llama-2-7B-Chat-GGML")
132
  file_ = gr.Textbox(label="File name" ,value="llama-2-7b-chat.ggmlv3.q2_K.bin")
133
- max_tokens = gr.inputs.Slider(1, MAX_NEW_TOKENS, default=16, label="Max new tokens", step=1)
134
  temperature = gr.inputs.Slider(0.1, 1., default=0.2, label="Temperature", step=0.1)
135
  top_k = gr.inputs.Slider(0.01, 1., default=0.95, label="Top K", step=0.01)
136
  top_p = gr.inputs.Slider(0, 100, default=50, label="Top P", step=1)
 
130
  gr.HTML("<h3>Only models from the GGML library are accepted.</h3>")
131
  repo_ = gr.Textbox(label="Repository" ,value="TheBloke/Llama-2-7B-Chat-GGML")
132
  file_ = gr.Textbox(label="File name" ,value="llama-2-7b-chat.ggmlv3.q2_K.bin")
133
+ max_tokens = gr.inputs.Slider(1, MAX_NEW_TOKENS, default=16, label="Max new tokens; Limited due to excessively long inference times, use Colab or local to avoid these restrictions.", step=1)
134
  temperature = gr.inputs.Slider(0.1, 1., default=0.2, label="Temperature", step=0.1)
135
  top_k = gr.inputs.Slider(0.01, 1., default=0.95, label="Top K", step=0.01)
136
  top_p = gr.inputs.Slider(0, 100, default=50, label="Top P", step=1)