JRosenkranz
committed on
Commit
•
3cb2f95
1
Parent(s):
0f37d3d
Update README.md
Browse files
README.md
CHANGED
@@ -89,7 +89,7 @@ pip install transformers==4.35.0 sentencepiece numpy
|
|
89 |
##### batch_size=1 (compile + cudagraphs)
|
90 |
|
91 |
```bash
|
92 |
-
MODEL_PATH=/path/to/llama/13B-F
|
93 |
python fms-extras/scripts/paged_speculative_inference.py \
|
94 |
--variant=13b \
|
95 |
--model_path=$MODEL_PATH \
|
@@ -104,7 +104,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
104 |
##### batch_size=1 (compile)
|
105 |
|
106 |
```bash
|
107 |
-
MODEL_PATH=/path/to/llama/13B-F
|
108 |
python fms-extras/scripts/paged_speculative_inference.py \
|
109 |
--variant=13b \
|
110 |
--model_path=$MODEL_PATH \
|
@@ -118,7 +118,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
118 |
##### batch_size=4 (compile)
|
119 |
|
120 |
```bash
|
121 |
-
MODEL_PATH=/path/to/llama/13B-F
|
122 |
python fms-extras/scripts/paged_speculative_inference.py \
|
123 |
--variant=13b \
|
124 |
--model_path=$MODEL_PATH \
|
|
|
89 |
##### batch_size=1 (compile + cudagraphs)
|
90 |
|
91 |
```bash
|
92 |
+
MODEL_PATH=/path/to/llama/hf/13B-F
|
93 |
python fms-extras/scripts/paged_speculative_inference.py \
|
94 |
--variant=13b \
|
95 |
--model_path=$MODEL_PATH \
|
|
|
104 |
##### batch_size=1 (compile)
|
105 |
|
106 |
```bash
|
107 |
+
MODEL_PATH=/path/to/llama/hf/13B-F
|
108 |
python fms-extras/scripts/paged_speculative_inference.py \
|
109 |
--variant=13b \
|
110 |
--model_path=$MODEL_PATH \
|
|
|
118 |
##### batch_size=4 (compile)
|
119 |
|
120 |
```bash
|
121 |
+
MODEL_PATH=/path/to/llama/hf/13B-F
|
122 |
python fms-extras/scripts/paged_speculative_inference.py \
|
123 |
--variant=13b \
|
124 |
--model_path=$MODEL_PATH \
|