JRosenkranz committed on
Commit
8c8a362
1 Parent(s): a68ddb6

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -46,7 +46,7 @@ docker run -d --rm --gpus all \
46
  -p 8033:8033 \
47
  -v /path/to/all/models:/models \
48
  -e MODEL_NAME=/models/model_weights/llama/13B-F \
49
- -e SPECULATOR_NAME=ibm-fms/llama-13b-accelerator \
50
  -e FLASH_ATTENTION=true \
51
  -e PAGED_ATTENTION=true \
52
  -e DTYPE_STR=float16 \
 
46
  -p 8033:8033 \
47
  -v /path/to/all/models:/models \
48
  -e MODEL_NAME=/models/model_weights/llama/13B-F \
49
+ -e SPECULATOR_NAME=/models/speculator_weights/llama/llama-13b-accelerator \
50
  -e FLASH_ATTENTION=true \
51
  -e PAGED_ATTENTION=true \
52
  -e DTYPE_STR=float16 \