danielhanchen committed on
Commit
c0d86e6
·
verified ·
1 Parent(s): 4828675

Upload Qwen3MoeForCausalLM

Browse files
config.json CHANGED
@@ -37,7 +37,9 @@
37
  "lm_head",
38
  "multi_modal_projector",
39
  "merger",
40
- "modality_projection"
 
 
41
  ],
42
  "llm_int8_threshold": 6.0,
43
  "load_in_4bit": true,
@@ -51,7 +53,7 @@
51
  "sliding_window": null,
52
  "tie_word_embeddings": false,
53
  "torch_dtype": "bfloat16",
54
- "transformers_version": "4.52.0.dev0",
55
  "unsloth_fixed": true,
56
  "use_cache": true,
57
  "use_sliding_window": false,
 
37
  "lm_head",
38
  "multi_modal_projector",
39
  "merger",
40
+ "modality_projection",
41
+ "router",
42
+ "gate"
43
  ],
44
  "llm_int8_threshold": 6.0,
45
  "load_in_4bit": true,
 
53
  "sliding_window": null,
54
  "tie_word_embeddings": false,
55
  "torch_dtype": "bfloat16",
56
+ "transformers_version": "4.51.3",
57
  "unsloth_fixed": true,
58
  "use_cache": true,
59
  "use_sliding_window": false,
generation_config.json CHANGED
@@ -10,5 +10,5 @@
10
  "temperature": 0.6,
11
  "top_k": 20,
12
  "top_p": 0.95,
13
- "transformers_version": "4.52.0.dev0"
14
  }
 
10
  "temperature": 0.6,
11
  "top_k": 20,
12
  "top_p": 0.95,
13
+ "transformers_version": "4.51.3"
14
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f134a6148997badd2e57c68d76a31113897e650bdee6130f34175b014645289d
3
- size 5003583957
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29dfd81dac895689a0bd25c6ce06b6db2b3be915c11b64037f239d678887cd91
3
+ size 5003311265
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1aa24383012941c0bf52479f873699e11a88273f9a93b706e11c15df6fba29ec
3
- size 5004623123
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73d09943a6b41353742128fee619a3a3498605f4960b81850318eccf880f922b
3
+ size 5004311598
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd7d02e7623fb12135ecc5c8084a1bc10642286af3a6115efbb748ceeb3b823f
3
- size 5004491710
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45c34622e3e4f078fbc072838bc851e90c0f0effd5f4ff6c2ae542a3eddb12ef
3
+ size 5004606290
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ecfd762d434289b7e10499af8011c027845be1cd9c55fbe3602bdd7a11139aa
3
- size 1699698382
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb43d4fcf1adb738c5306e77180f2e4ff835895bf9c0bd3c14db5b3a422b04c5
3
+ size 1718755365
model.safetensors.index.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57036f3967b2cffe3a1c962ee227d93d90b8d11ce9e372a34bfeb4c3fc85000b
3
- size 11572484
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6859142ac2ef5517976903441eb510cb5d9e59027137a60ad10e7dd04790f58
3
+ size 11550790