yentinglin committed on
Commit
7a3d937
1 Parent(s): 07ac9a2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -60,7 +60,7 @@ endpoint_url = os.environ.get("ENDPOINT_URL", "http://127.0.0.1:8080")
60
  client = Client(endpoint_url, timeout=120)
61
  eos_token = "</s>"
62
  MAX_MAX_NEW_TOKENS = 1024
63
- DEFAULT_MAX_NEW_TOKENS = 256
64
 
65
  max_prompt_length = 4096 - MAX_MAX_NEW_TOKENS - 10
66
 
@@ -237,5 +237,5 @@ with gr.Blocks() as demo:
237
 
238
  gr.Markdown(LICENSE)
239
 
240
- demo.queue(max_size=128)
241
  demo.launch()
 
60
  client = Client(endpoint_url, timeout=120)
61
  eos_token = "</s>"
62
  MAX_MAX_NEW_TOKENS = 1024
63
+ DEFAULT_MAX_NEW_TOKENS = 1024
64
 
65
  max_prompt_length = 4096 - MAX_MAX_NEW_TOKENS - 10
66
 
 
237
 
238
  gr.Markdown(LICENSE)
239
 
240
+ demo.queue(concurrency_count=4, max_size=128)
241
  demo.launch()