mwitiderrick
committed on
Commit
•
22ff818
1
Parent(s):
4e2bc8e
Update README.md
Browse files
README.md
CHANGED
@@ -20,7 +20,7 @@ Run in a Python pipeline for local inference:
|
|
20 |
```python
|
21 |
from vllm import LLM, SamplingParams
|
22 |
|
23 |
-
model = LLM("nm-testing/TinyLlama-1.1B-Chat-v1.0-pruned2.4", sparsity="
|
24 |
prompt = "How to make banana bread?"
|
25 |
formatted_prompt = f"<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant\n"
|
26 |
|
|
|
20 |
```python
|
21 |
from vllm import LLM, SamplingParams
|
22 |
|
23 |
+
model = LLM("nm-testing/TinyLlama-1.1B-Chat-v1.0-pruned2.4", sparsity="semi_structured_sparse_w16a16")
|
24 |
prompt = "How to make banana bread?"
|
25 |
formatted_prompt = f"<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant\n"
|
26 |
|