ffreemt committed on
Commit
f073be5
1 Parent(s): b01b8ee

Adjust queue size

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -377,8 +377,8 @@ with gr.Blocks(title="ChatGLM2-6B-int4", theme=gr.themes.Soft(text_size="sm")) a
377
  # demo.queue().launch(share=True, inbrowser=True, debug=True)
378
 
379
  # concurrency_count > 1 requires more memory, max_size: queue size
380
- # T4 medium: 30GB, model size: ~6G concurrency_count = 3
381
  # leave one for api access
382
- # reduce to 3 if OOM
383
 
384
- demo.queue(concurrency_count=4, max_size=20).launch(debug=True)
 
377
  # demo.queue().launch(share=True, inbrowser=True, debug=True)
378
 
379
  # concurrency_count > 1 requires more memory, max_size: queue size
380
+ # T4 medium: 30GB, model size: ~4G concurrency_count = 6
381
  # leave one for api access
382
+ # reduce to 5 if OOM occurs too often
383
 
384
+ demo.queue(concurrency_count=6, max_size=30).launch(debug=True)