Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- merges.txt +0 -0
- mlc-chat-config.json +91 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen3_moe",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 4096,
|
8 |
+
"intermediate_size": 12288,
|
9 |
+
"attention_bias": false,
|
10 |
+
"num_attention_heads": 64,
|
11 |
+
"num_hidden_layers": 94,
|
12 |
+
"num_key_value_heads": 4,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"rope_theta": 1000000.0,
|
15 |
+
"vocab_size": 151936,
|
16 |
+
"tie_word_embeddings": false,
|
17 |
+
"context_window_size": 40960,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"head_dim": 128,
|
21 |
+
"dtype": "float32",
|
22 |
+
"max_batch_size": 128,
|
23 |
+
"weight_block_size": null,
|
24 |
+
"moe_intermediate_size": 1536,
|
25 |
+
"num_experts_per_tok": 8,
|
26 |
+
"num_experts": 128,
|
27 |
+
"decoder_sparse_step": 1,
|
28 |
+
"norm_topk_prob": true
|
29 |
+
},
|
30 |
+
"vocab_size": 151936,
|
31 |
+
"context_window_size": 40960,
|
32 |
+
"sliding_window_size": -1,
|
33 |
+
"prefill_chunk_size": 2048,
|
34 |
+
"attention_sink_size": -1,
|
35 |
+
"tensor_parallel_shards": 1,
|
36 |
+
"pipeline_parallel_stages": 1,
|
37 |
+
"temperature": 0.6,
|
38 |
+
"presence_penalty": 0.0,
|
39 |
+
"frequency_penalty": 0.0,
|
40 |
+
"repetition_penalty": 1.0,
|
41 |
+
"top_p": 0.95,
|
42 |
+
"tokenizer_files": [
|
43 |
+
"tokenizer.json",
|
44 |
+
"vocab.json",
|
45 |
+
"merges.txt",
|
46 |
+
"tokenizer_config.json"
|
47 |
+
],
|
48 |
+
"tokenizer_info": {
|
49 |
+
"token_postproc_method": "byte_level",
|
50 |
+
"prepend_space_in_encode": false,
|
51 |
+
"strip_space_in_decode": false
|
52 |
+
},
|
53 |
+
"conv_template": {
|
54 |
+
"name": "qwen2",
|
55 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
56 |
+
"system_message": "You are a helpful assistant.",
|
57 |
+
"system_prefix_token_ids": null,
|
58 |
+
"add_role_after_system_message": true,
|
59 |
+
"roles": {
|
60 |
+
"user": "<|im_start|>user",
|
61 |
+
"assistant": "<|im_start|>assistant"
|
62 |
+
},
|
63 |
+
"role_templates": {
|
64 |
+
"user": "{user_message}",
|
65 |
+
"assistant": "{assistant_message}",
|
66 |
+
"tool": "{tool_message}"
|
67 |
+
},
|
68 |
+
"messages": [],
|
69 |
+
"seps": [
|
70 |
+
"<|im_end|>\n"
|
71 |
+
],
|
72 |
+
"role_content_sep": "\n",
|
73 |
+
"role_empty_sep": "\n",
|
74 |
+
"stop_str": [
|
75 |
+
"<|endoftext|>",
|
76 |
+
"<|im_end|>"
|
77 |
+
],
|
78 |
+
"stop_token_ids": [
|
79 |
+
151643,
|
80 |
+
151645
|
81 |
+
],
|
82 |
+
"function_string": "",
|
83 |
+
"use_function_calling": false
|
84 |
+
},
|
85 |
+
"pad_token_id": 151643,
|
86 |
+
"bos_token_id": 151643,
|
87 |
+
"eos_token_id": [
|
88 |
+
151645,
|
89 |
+
151643
|
90 |
+
]
|
91 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86a281ecbf19ef6038231b527e6a48e413d196a67ec9755b04c6ca6a120869d4
|
3 |
+
size 1244659712
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45057c9dfb06477bbb191d3e08ba048c588b1331137866e08db70fefaddb6d5a
|
3 |
+
size 1610612736
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4462846b0f7366b3e0d2a1a61666c3cf5b70d95c95fb70103c99cf08b0e958b0
|
3 |
+
size 75497472
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a446a04dd975c9c9d75e0f80a0cd1918079b44022e5b5ecd8c5199c3318a36ea
|
3 |
+
size 75497472
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c4e2d4ad8a818fb29e6c8a3e650fd468c93c465c53b36e37a807f54839debd7
|
3 |
+
size 67108864
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed915b74440a764b8175f12d025b7f27acaa686a6a1ec442c4ee35def8cb2d09
|
3 |
+
size 1610612736
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b79f8be5391dbc3321f261f77aa3c3c174e1b302f1b168b918ce016df3fd56f
|
3 |
+
size 3221225472
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c05b8fdb259477ba0dcccf2c99e33e97d484b14ab8ae0ccba973779d2bf1f97
|
3 |
+
size 75497472
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ade3a37c77bd13552897edc6d6b8facca512acfe7b57b042b4d2c41232376c0
|
3 |
+
size 67108864
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73a477e680d863250e69ef1b277366b4fa89752fd51543789e9bc2e13fb0598c
|
3 |
+
size 1610612736
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:031e2514306a73bc080c52c064c1583e3da1136576112eabb3fd88807395dc33
|
3 |
+
size 3221225472
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0290cd6bf8b3da4d6a16125eb315208705b6a69b268d92a6eb10a04f1eb29f06
|
3 |
+
size 75497472
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a02a8b1bffd233f7e7bb56cc59eeec2f37f51609ad2d762a7334e990be0396f4
|
3 |
+
size 67108864
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f26bb3ab4e24f34f875cfbd3707d3e72229e1f735205e79eb8700b847c6f97ac
|
3 |
+
size 67108864
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af85dad553413ea5c286fdb04ae0c6012feaa388c1841db3da6f63708d829ee6
|
3 |
+
size 1610612736
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6300f73688810bbbacc7268f3ceb92ba80c08439050d16d6deeb90e83fbed2ad
|
3 |
+
size 3221225472
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3d412d280db78f3569d58c51f227422d91742b335058cfbe260a946d7d27a97
|
3 |
+
size 75497472
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8054aee664356201d4f10f9c98e0b1a93b007ae73f682110eaec1a15625f349
|
3 |
+
size 67108864
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f39b9c4aedef6e76d16307e137be245a4445310e9d984cd231b8c39cb5ffed3
|
3 |
+
size 1610612736
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63a51268b60b74a8ee609877a91e2f7fea73d4c30aceec29cafd9dbd92901670
|
3 |
+
size 3221225472
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f93be7e4e67f57a24288c8f1cb6e661bb10e81b5f967dad5af10d9b1d939157d
|
3 |
+
size 75497472
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43244b87e6b111000a5ad1814d9ecc4d86a5fb67415a483c8c199609f9ce83e0
|
3 |
+
size 67108864
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17cc23b9807cf4cbc86f8a77296a2c64c6123908f1cbd9ae81b1e4473b3c8bd3
|
3 |
+
size 1610612736
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d81e0507c22b84248bdda5f99b4f25067cfa66a5d787b548ffd16ab2b307610
|
3 |
+
size 3221225472
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b7d233686ad7cfd1426fa8dce4ca4c759ba6dede7a4725a4c1983e8cd28a60
|
3 |
+
size 1610612736
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e716d0a835e361b71d15e0eac836c24197de519ff6ee8efd217dcfa19044806
|
3 |
+
size 75497472
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68b665177452ee0a55f913fdd02f16925734b860a2809bfba5750931ad1810a2
|
3 |
+
size 67108864
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb2f1fefa8bc796472f78ae7b4d3ad966c1da170c0ef58ddf7fc84f3dfc26ddd
|
3 |
+
size 1610612736
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f736f3c8badfa7b2a5c0a4fdc2a3cba5aa14d5c6cb13eb278d08f6246ff47e65
|
3 |
+
size 3221225472
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cc23c6045c64a993378aada8d5f6d76a857e0620a43f32fde4ed17056adbb38
|
3 |
+
size 75497472
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f236b6fa96900243d7c11173bf849a9d2dfaccc7d52813f3a8210b47cd133c1
|
3 |
+
size 67108864
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8544aac73a45a877eb71ce47d8df51c276ebd394b8b5b39b36a97a25b4c3380
|
3 |
+
size 1610612736
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04c3a5674e1276536e994a45a8357f4f408e6bb3260aec3c0696eb8ec42774ea
|
3 |
+
size 3221225472
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1daa0dcd0ab49f485d6a1c84001dffd97814414712ce2fa76a71c318e0d47611
|
3 |
+
size 75497472
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e637b2b882b05782e1558ade6de7bc0eac56e8c384615370c45e159456a5913
|
3 |
+
size 67108864
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ed1ee86cba3868f78357f0820356d64c9ef27d3a4fee4253ab7d5cc2ad96cea
|
3 |
+
size 3221225472
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2de9f5ffe08042ec36486759abe51da5abe4ec2f3c83573664be7ba4c4c192ca
|
3 |
+
size 1610612736
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68c26e6e0c9aeb3d78e7337a2ef376bac8ca8176c661d00a8ced324199c73250
|
3 |
+
size 3221225472
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecd90e1d8ec6a4af32544e97f726d475d112f4917ad11c4991c2ccbcb849db0b
|
3 |
+
size 33054208
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47322fc88f94a7b11b297f190355d49ce6787d4061966a24f576a70265c3b625
|
3 |
+
size 75497472
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:974b6375b3b32e9039b055db018a4a44ae38cb651f6b39be5ec20b1a325cebc1
|
3 |
+
size 67108864
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15de13642207b1841b92a87f36986d81a7aa769bb316d8d6c468b4912e325f5
|
3 |
+
size 1610612736
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1b3e9319b4e6798c30ab7f12d7970fbb4719f8a990ca92ebac94ea99b256a89
|
3 |
+
size 3221225472
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5161f208491d1c3ad4d4641739ebd5edf4a54d981a2bbb387640ac1777b9cde
|
3 |
+
size 75497472
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a930deb2aa2471e82ca27b18756176078359859b8f44808b8789eca3629f6735
|
3 |
+
size 67108864
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f665fe950d1ab140a177f61d49a90b4b2426508643c87ab305d25b45b391ce6
|
3 |
+
size 1610612736
|