Update README.md
Browse files
README.md
CHANGED
|
@@ -135,7 +135,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
| 135 |
--model_path=$MODEL_PATH \
|
| 136 |
--model_source=hf \
|
| 137 |
--tokenizer=$MODEL_PATH \
|
| 138 |
-
--speculator_path=ibm-fms/
|
| 139 |
--speculator_source=hf \
|
| 140 |
--speculator_variant=3_2b \
|
| 141 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
@@ -153,7 +153,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
| 153 |
--model_path=$MODEL_PATH \
|
| 154 |
--model_source=hf \
|
| 155 |
--tokenizer=$MODEL_PATH \
|
| 156 |
-
--speculator_path=ibm-fms/
|
| 157 |
--speculator_source=hf \
|
| 158 |
--speculator_variant=3_2b \
|
| 159 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
@@ -170,7 +170,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
| 170 |
--model_path=$MODEL_PATH \
|
| 171 |
--model_source=hf \
|
| 172 |
--tokenizer=$MODEL_PATH \
|
| 173 |
-
--speculator_path=ibm-fms/
|
| 174 |
--speculator_source=hf \
|
| 175 |
--speculator_variant=3_2b \
|
| 176 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
|
| 135 |
--model_path=$MODEL_PATH \
|
| 136 |
--model_source=hf \
|
| 137 |
--tokenizer=$MODEL_PATH \
|
| 138 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
| 139 |
--speculator_source=hf \
|
| 140 |
--speculator_variant=3_2b \
|
| 141 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
|
| 153 |
--model_path=$MODEL_PATH \
|
| 154 |
--model_source=hf \
|
| 155 |
--tokenizer=$MODEL_PATH \
|
| 156 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
| 157 |
--speculator_source=hf \
|
| 158 |
--speculator_variant=3_2b \
|
| 159 |
--top_k_tokens_per_head=4,3,2,2 \
|
|
|
|
| 170 |
--model_path=$MODEL_PATH \
|
| 171 |
--model_source=hf \
|
| 172 |
--tokenizer=$MODEL_PATH \
|
| 173 |
+
--speculator_path=ibm-fms/llama3-8b-accelerator \
|
| 174 |
--speculator_source=hf \
|
| 175 |
--speculator_variant=3_2b \
|
| 176 |
--top_k_tokens_per_head=4,3,2,2 \
|