Add FP8 dynamically quantized Qwen3-0.6B-Base model using llm-compressor
Browse files
- config.json +1 -1
- generation_config.json +1 -1
- model.safetensors +1 -1
config.json
CHANGED
@@ -65,7 +65,7 @@
|
|
65 |
"sliding_window": null,
|
66 |
"tie_word_embeddings": true,
|
67 |
"torch_dtype": "bfloat16",
|
68 |
-
"transformers_version": "4.52.
|
69 |
"use_cache": true,
|
70 |
"use_sliding_window": false,
|
71 |
"vocab_size": 151936
|
|
|
65 |
"sliding_window": null,
|
66 |
"tie_word_embeddings": true,
|
67 |
"torch_dtype": "bfloat16",
|
68 |
+
"transformers_version": "4.52.4",
|
69 |
"use_cache": true,
|
70 |
"use_sliding_window": false,
|
71 |
"vocab_size": 151936
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"bos_token_id": 151643,
|
3 |
"eos_token_id": 151643,
|
4 |
"max_new_tokens": 2048,
|
5 |
-
"transformers_version": "4.52.
|
6 |
}
|
|
|
2 |
"bos_token_id": 151643,
|
3 |
"eos_token_id": 151643,
|
4 |
"max_new_tokens": 2048,
|
5 |
+
"transformers_version": "4.52.4"
|
6 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1069802016
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9df3b1dc1785115e8b679849372d1a5d5abc85573495458f96d060d926f23cfb
|
3 |
size 1069802016
|