Update README.md
Browse files
README.md
CHANGED
@@ -16,7 +16,7 @@ This model is an int4 model symmetric quantized with group_size 128 of [Qwen/Qwe
|
|
16 |
### INT4 CPU/CUDA Inference
|
17 |
|
18 |
```python
|
19 |
-
## pip install auto-round
|
20 |
from auto_round import AutoRoundConfig ##must import for auto-round format
|
21 |
import torch
|
22 |
from transformers import AutoModelForCausalLM,AutoTokenizer
|
|
|
16 |
### INT4 CPU/CUDA Inference
|
17 |
|
18 |
```python
|
19 |
+
## pip install auto-round (cpu needs version > 0.3.1)
|
20 |
from auto_round import AutoRoundConfig ##must import for auto-round format
|
21 |
import torch
|
22 |
from transformers import AutoModelForCausalLM,AutoTokenizer
|