joaogante HF staff committed on
Commit
817dcba
1 Parent(s): c93ec2a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -57,8 +57,7 @@ with gr.Blocks() as demo:
57
  "# 🤗 Assisted Generation Demo\n"
58
  f"- Model: {model_id} (INT8, ~7GB)\n"
59
  f"- Assistant Model: {assistant_id} (FP16, ~0.3GB)\n"
60
- "- Running on a T4 GPU\n"
61
- "- Best results are obtained when the model size difference in parameters is >10x"
62
  )
63
 
64
  with gr.Row():
 
57
  "# 🤗 Assisted Generation Demo\n"
58
  f"- Model: {model_id} (INT8, ~7GB)\n"
59
  f"- Assistant Model: {assistant_id} (FP16, ~0.3GB)\n"
60
+ "- Recipe for speedup: a) >10x model size difference in parameters; b) assistant trained similarly; c) CPU is not a bottleneck"
 
61
  )
62
 
63
  with gr.Row():