riczhou commited on
Commit
4879165
·
verified ·
1 Parent(s): 7fb676a

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3_moe",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 4096,
8
+ "intermediate_size": 12288,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 64,
11
+ "num_hidden_layers": 94,
12
+ "num_key_value_heads": 4,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000.0,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128,
23
+ "weight_block_size": null,
24
+ "moe_intermediate_size": 1536,
25
+ "num_experts_per_tok": 8,
26
+ "num_experts": 128,
27
+ "decoder_sparse_step": 1,
28
+ "norm_topk_prob": true
29
+ },
30
+ "vocab_size": 151936,
31
+ "context_window_size": 40960,
32
+ "sliding_window_size": -1,
33
+ "prefill_chunk_size": 2048,
34
+ "attention_sink_size": -1,
35
+ "tensor_parallel_shards": 1,
36
+ "pipeline_parallel_stages": 1,
37
+ "temperature": 0.6,
38
+ "presence_penalty": 0.0,
39
+ "frequency_penalty": 0.0,
40
+ "repetition_penalty": 1.0,
41
+ "top_p": 0.95,
42
+ "tokenizer_files": [
43
+ "tokenizer.json",
44
+ "vocab.json",
45
+ "merges.txt",
46
+ "tokenizer_config.json"
47
+ ],
48
+ "tokenizer_info": {
49
+ "token_postproc_method": "byte_level",
50
+ "prepend_space_in_encode": false,
51
+ "strip_space_in_decode": false
52
+ },
53
+ "conv_template": {
54
+ "name": "qwen2",
55
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
56
+ "system_message": "You are a helpful assistant.",
57
+ "system_prefix_token_ids": null,
58
+ "add_role_after_system_message": true,
59
+ "roles": {
60
+ "user": "<|im_start|>user",
61
+ "assistant": "<|im_start|>assistant"
62
+ },
63
+ "role_templates": {
64
+ "user": "{user_message}",
65
+ "assistant": "{assistant_message}",
66
+ "tool": "{tool_message}"
67
+ },
68
+ "messages": [],
69
+ "seps": [
70
+ "<|im_end|>\n"
71
+ ],
72
+ "role_content_sep": "\n",
73
+ "role_empty_sep": "\n",
74
+ "stop_str": [
75
+ "<|endoftext|>",
76
+ "<|im_end|>"
77
+ ],
78
+ "stop_token_ids": [
79
+ 151643,
80
+ 151645
81
+ ],
82
+ "function_string": "",
83
+ "use_function_calling": false
84
+ },
85
+ "pad_token_id": 151643,
86
+ "bos_token_id": 151643,
87
+ "eos_token_id": [
88
+ 151645,
89
+ 151643
90
+ ]
91
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86a281ecbf19ef6038231b527e6a48e413d196a67ec9755b04c6ca6a120869d4
3
+ size 1244659712
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45057c9dfb06477bbb191d3e08ba048c588b1331137866e08db70fefaddb6d5a
3
+ size 1610612736
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4462846b0f7366b3e0d2a1a61666c3cf5b70d95c95fb70103c99cf08b0e958b0
3
+ size 75497472
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a446a04dd975c9c9d75e0f80a0cd1918079b44022e5b5ecd8c5199c3318a36ea
3
+ size 75497472
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c4e2d4ad8a818fb29e6c8a3e650fd468c93c465c53b36e37a807f54839debd7
3
+ size 67108864
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed915b74440a764b8175f12d025b7f27acaa686a6a1ec442c4ee35def8cb2d09
3
+ size 1610612736
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b79f8be5391dbc3321f261f77aa3c3c174e1b302f1b168b918ce016df3fd56f
3
+ size 3221225472
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c05b8fdb259477ba0dcccf2c99e33e97d484b14ab8ae0ccba973779d2bf1f97
3
+ size 75497472
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ade3a37c77bd13552897edc6d6b8facca512acfe7b57b042b4d2c41232376c0
3
+ size 67108864
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a477e680d863250e69ef1b277366b4fa89752fd51543789e9bc2e13fb0598c
3
+ size 1610612736
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:031e2514306a73bc080c52c064c1583e3da1136576112eabb3fd88807395dc33
3
+ size 3221225472
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0290cd6bf8b3da4d6a16125eb315208705b6a69b268d92a6eb10a04f1eb29f06
3
+ size 75497472
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a02a8b1bffd233f7e7bb56cc59eeec2f37f51609ad2d762a7334e990be0396f4
3
+ size 67108864
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f26bb3ab4e24f34f875cfbd3707d3e72229e1f735205e79eb8700b847c6f97ac
3
+ size 67108864
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af85dad553413ea5c286fdb04ae0c6012feaa388c1841db3da6f63708d829ee6
3
+ size 1610612736
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6300f73688810bbbacc7268f3ceb92ba80c08439050d16d6deeb90e83fbed2ad
3
+ size 3221225472
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3d412d280db78f3569d58c51f227422d91742b335058cfbe260a946d7d27a97
3
+ size 75497472
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8054aee664356201d4f10f9c98e0b1a93b007ae73f682110eaec1a15625f349
3
+ size 67108864
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f39b9c4aedef6e76d16307e137be245a4445310e9d984cd231b8c39cb5ffed3
3
+ size 1610612736
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a51268b60b74a8ee609877a91e2f7fea73d4c30aceec29cafd9dbd92901670
3
+ size 3221225472
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f93be7e4e67f57a24288c8f1cb6e661bb10e81b5f967dad5af10d9b1d939157d
3
+ size 75497472
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43244b87e6b111000a5ad1814d9ecc4d86a5fb67415a483c8c199609f9ce83e0
3
+ size 67108864
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17cc23b9807cf4cbc86f8a77296a2c64c6123908f1cbd9ae81b1e4473b3c8bd3
3
+ size 1610612736
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d81e0507c22b84248bdda5f99b4f25067cfa66a5d787b548ffd16ab2b307610
3
+ size 3221225472
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b7d233686ad7cfd1426fa8dce4ca4c759ba6dede7a4725a4c1983e8cd28a60
3
+ size 1610612736
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e716d0a835e361b71d15e0eac836c24197de519ff6ee8efd217dcfa19044806
3
+ size 75497472
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68b665177452ee0a55f913fdd02f16925734b860a2809bfba5750931ad1810a2
3
+ size 67108864
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb2f1fefa8bc796472f78ae7b4d3ad966c1da170c0ef58ddf7fc84f3dfc26ddd
3
+ size 1610612736
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f736f3c8badfa7b2a5c0a4fdc2a3cba5aa14d5c6cb13eb278d08f6246ff47e65
3
+ size 3221225472
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cc23c6045c64a993378aada8d5f6d76a857e0620a43f32fde4ed17056adbb38
3
+ size 75497472
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f236b6fa96900243d7c11173bf849a9d2dfaccc7d52813f3a8210b47cd133c1
3
+ size 67108864
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8544aac73a45a877eb71ce47d8df51c276ebd394b8b5b39b36a97a25b4c3380
3
+ size 1610612736
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04c3a5674e1276536e994a45a8357f4f408e6bb3260aec3c0696eb8ec42774ea
3
+ size 3221225472
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1daa0dcd0ab49f485d6a1c84001dffd97814414712ce2fa76a71c318e0d47611
3
+ size 75497472
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e637b2b882b05782e1558ade6de7bc0eac56e8c384615370c45e159456a5913
3
+ size 67108864
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed1ee86cba3868f78357f0820356d64c9ef27d3a4fee4253ab7d5cc2ad96cea
3
+ size 3221225472
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2de9f5ffe08042ec36486759abe51da5abe4ec2f3c83573664be7ba4c4c192ca
3
+ size 1610612736
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68c26e6e0c9aeb3d78e7337a2ef376bac8ca8176c661d00a8ced324199c73250
3
+ size 3221225472
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd90e1d8ec6a4af32544e97f726d475d112f4917ad11c4991c2ccbcb849db0b
3
+ size 33054208
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47322fc88f94a7b11b297f190355d49ce6787d4061966a24f576a70265c3b625
3
+ size 75497472
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974b6375b3b32e9039b055db018a4a44ae38cb651f6b39be5ec20b1a325cebc1
3
+ size 67108864
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c15de13642207b1841b92a87f36986d81a7aa769bb316d8d6c468b4912e325f5
3
+ size 1610612736
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1b3e9319b4e6798c30ab7f12d7970fbb4719f8a990ca92ebac94ea99b256a89
3
+ size 3221225472
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5161f208491d1c3ad4d4641739ebd5edf4a54d981a2bbb387640ac1777b9cde
3
+ size 75497472
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a930deb2aa2471e82ca27b18756176078359859b8f44808b8789eca3629f6735
3
+ size 67108864
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f665fe950d1ab140a177f61d49a90b4b2426508643c87ab305d25b45b391ce6
3
+ size 1610612736