mwitiderrick
committed on
Commit
•
9ecef0e
1
Parent(s):
fc3f2b9
Update README.md
Browse files
README.md
CHANGED
@@ -22,7 +22,7 @@ Run in a Python pipeline for local inference:
|
|
22 |
```python
|
23 |
from vllm import LLM, SamplingParams
|
24 |
|
25 |
-
model = LLM("nm-testing/Nous-Hermes-2-Yi-34B-
|
26 |
prompt = "How to make banana bread?"
|
27 |
formatted_prompt = f"<|im_start|>User:{prompt}\n<|im_start|>assistant:\n"
|
28 |
|
|
|
22 |
```python
|
23 |
from vllm import LLM, SamplingParams
|
24 |
|
25 |
+
model = LLM("nm-testing/Nous-Hermes-2-Yi-34B-pruned50", sparsity="sparse_w16a16")
|
26 |
prompt = "How to make banana bread?"
|
27 |
formatted_prompt = f"<|im_start|>User:{prompt}\n<|im_start|>assistant:\n"
|
28 |
|