Update README.md
Browse files
README.md
CHANGED
@@ -15,7 +15,7 @@ This model is an int4 auto-round model with group_size 128 of [Qwen/Qwen2-7B](ht
|
|
15 |
### INT4 Inference
|
16 |
|
17 |
```python
|
18 |
-
##pip install auto-round
|
19 |
from auto_round import AutoRoundConfig ##must import for auto_round format
|
20 |
from transformers import AutoModelForCausalLM,AutoTokenizer
|
21 |
quantized_model_dir = "Intel/Qwen2-7B-int4-inc"
|
|
|
15 |
### INT4 Inference
|
16 |
|
17 |
```python
|
18 |
+
##pip install auto-round (cpu needs version > 0.3.1)
|
19 |
from auto_round import AutoRoundConfig ##must import for auto_round format
|
20 |
from transformers import AutoModelForCausalLM,AutoTokenizer
|
21 |
quantized_model_dir = "Intel/Qwen2-7B-int4-inc"
|