CarlOwOs committed on
Commit
0a3e19f
·
verified ·
1 Parent(s): 34e054c

Add FP8 dynamically quantized Qwen3-0.6B-Base model using llm-compressor

Browse files
Files changed (3) hide show
  1. config.json +1 -1
  2. generation_config.json +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -65,7 +65,7 @@
65
  "sliding_window": null,
66
  "tie_word_embeddings": true,
67
  "torch_dtype": "bfloat16",
68
- "transformers_version": "4.52.3",
69
  "use_cache": true,
70
  "use_sliding_window": false,
71
  "vocab_size": 151936
 
65
  "sliding_window": null,
66
  "tie_word_embeddings": true,
67
  "torch_dtype": "bfloat16",
68
+ "transformers_version": "4.52.4",
69
  "use_cache": true,
70
  "use_sliding_window": false,
71
  "vocab_size": 151936
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "bos_token_id": 151643,
3
  "eos_token_id": 151643,
4
  "max_new_tokens": 2048,
5
- "transformers_version": "4.52.3"
6
  }
 
2
  "bos_token_id": 151643,
3
  "eos_token_id": 151643,
4
  "max_new_tokens": 2048,
5
+ "transformers_version": "4.52.4"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93b9e00ceea769d885151d1c6a331fe8fffa4d0f3d8bfb7a3d9cafd93fd2a889
3
  size 1069802016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9df3b1dc1785115e8b679849372d1a5d5abc85573495458f96d060d926f23cfb
3
  size 1069802016