JRosenkranz
committed on
Commit
•
510bfdb
1
Parent(s):
8ac38c5
Update README.md
Browse files
README.md
CHANGED
@@ -135,7 +135,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
135 |
--model_path=$MODEL_PATH \
|
136 |
--model_source=hf \
|
137 |
--tokenizer=$MODEL_PATH \
|
138 |
-
--speculator_path=ibm-fms/
|
139 |
--speculator_source=hf \
|
140 |
--speculator_variant=3_2b \
|
141 |
--top_k_tokens_per_head=4,3,2,2 \
|
@@ -153,7 +153,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
153 |
--model_path=$MODEL_PATH \
|
154 |
--model_source=hf \
|
155 |
--tokenizer=$MODEL_PATH \
|
156 |
-
--speculator_path=ibm-fms/
|
157 |
--speculator_source=hf \
|
158 |
--speculator_variant=3_2b \
|
159 |
--top_k_tokens_per_head=4,3,2,2 \
|
@@ -170,7 +170,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
170 |
--model_path=$MODEL_PATH \
|
171 |
--model_source=hf \
|
172 |
--tokenizer=$MODEL_PATH \
|
173 |
-
--speculator_path=ibm-fms/
|
174 |
--speculator_source=hf \
|
175 |
--speculator_variant=3_2b \
|
176 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
135 |
--model_path=$MODEL_PATH \
|
136 |
--model_source=hf \
|
137 |
--tokenizer=$MODEL_PATH \
|
138 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
139 |
--speculator_source=hf \
|
140 |
--speculator_variant=3_2b \
|
141 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
153 |
--model_path=$MODEL_PATH \
|
154 |
--model_source=hf \
|
155 |
--tokenizer=$MODEL_PATH \
|
156 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
157 |
--speculator_source=hf \
|
158 |
--speculator_variant=3_2b \
|
159 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
170 |
--model_path=$MODEL_PATH \
|
171 |
--model_source=hf \
|
172 |
--tokenizer=$MODEL_PATH \
|
173 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
174 |
--speculator_source=hf \
|
175 |
--speculator_variant=3_2b \
|
176 |
--top_k_tokens_per_head=4,3,2,2 \
|