Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- merges.txt +0 -0
- mlc-chat-config.json +85 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen3",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 5120,
|
8 |
+
"intermediate_size": 25600,
|
9 |
+
"attention_bias": false,
|
10 |
+
"num_attention_heads": 64,
|
11 |
+
"num_hidden_layers": 64,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"rope_theta": 1000000,
|
15 |
+
"vocab_size": 151936,
|
16 |
+
"tie_word_embeddings": false,
|
17 |
+
"context_window_size": 40960,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"head_dim": 128,
|
21 |
+
"dtype": "float32",
|
22 |
+
"max_batch_size": 128
|
23 |
+
},
|
24 |
+
"vocab_size": 151936,
|
25 |
+
"context_window_size": 40960,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 0.6,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 0.95,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"vocab.json",
|
39 |
+
"merges.txt",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_level",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "qwen2",
|
49 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
50 |
+
"system_message": "You are a helpful assistant.",
|
51 |
+
"system_prefix_token_ids": null,
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "<|im_start|>user",
|
55 |
+
"assistant": "<|im_start|>assistant"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"<|im_end|>\n"
|
65 |
+
],
|
66 |
+
"role_content_sep": "\n",
|
67 |
+
"role_empty_sep": "\n",
|
68 |
+
"stop_str": [
|
69 |
+
"<|endoftext|>",
|
70 |
+
"<|im_end|>"
|
71 |
+
],
|
72 |
+
"stop_token_ids": [
|
73 |
+
151643,
|
74 |
+
151645
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 151643,
|
80 |
+
"bos_token_id": 151643,
|
81 |
+
"eos_token_id": [
|
82 |
+
151645,
|
83 |
+
151643
|
84 |
+
]
|
85 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff0d0629283ca39aa7463b551128eb08b14852f063607bc52c22b34871e4a3b4
|
3 |
+
size 1555824640
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:961a81d70cb6cdf10115732263bccc29af3e4d5335e16c74af445977056eddc8
|
3 |
+
size 262144000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:266cf172f350d07d89afa4d98187a5dc127a95efaf69fec624596983eb8bd883
|
3 |
+
size 104857600
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f53479396d0e298216d3c07e3e9f4b6234b213d6c12bd579e012dd77b91c151d
|
3 |
+
size 262144000
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f84bfa74ea72e41c608d3170f2fa820ae3b69820bb30ea529d1375f91cbd3ed4
|
3 |
+
size 524288000
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38c7edd0acf171d48ff0bc330c77ad96945d52fa03734c2a2dbc309d09908107
|
3 |
+
size 104857600
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:134280a7af4f3272d0ba37eaf622dd9af992b469502b452adef4b73d9e501d5d
|
3 |
+
size 83886080
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:980e61027f2954b296e959527d3684bc82070c5124559eef937ac0562d47113f
|
3 |
+
size 262144000
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c4f6075069a990dc6488c5a06b39d744d9a034a442956c75e7e0e30c0df43af
|
3 |
+
size 524288000
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4119b37cf64511ebc5b6d78ade321fec4ec305f083f7b638d86aa70d937d7653
|
3 |
+
size 104857600
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5efa2cde859117f333f091fb56cf6c13fcf6ce80440df2566aab214f85ff9af9
|
3 |
+
size 83886080
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9b7532443a32c461ddaba886c7266327110251fcefcce92711ba1f4139a92cb
|
3 |
+
size 262144000
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46ecc56cf6207df463b57a92235f9bb40655fb06f8091e5c3a18e16c83216541
|
3 |
+
size 524288000
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:074fec20bd9ba0b8b843982ac3da1d0a1357b2058ec2076cc9bc0575471bb617
|
3 |
+
size 83886080
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cca4d75355300192166321747fc0b5753bd3fef9f725da6c9e123bc3b005303e
|
3 |
+
size 104857600
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8dcd515b8d9d4d824f550ab23f89ba3a835e9bcb7a16bc1be35bea522d7ac1f
|
3 |
+
size 83886080
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8abd0f853ba12714def448055d03a36bc76b9bd570c954cf6b92c65681bc813a
|
3 |
+
size 524288000
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00df036b775f50a48dae448d1f490ca1ca5f65e680c8795705ec29fbb5e7e079
|
3 |
+
size 104857600
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f67d4cbef8e444d9c4b4c52e8ccb02a07b01e8a429ab274d3cec40dc0eec95ae
|
3 |
+
size 83886080
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d42e32e116532200f66fd7ce7b796a2bd4261d97c85a13c2558040d5e743f29
|
3 |
+
size 262144000
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a9673e74ba2eed80de0c54eef8c0971191b448a8146ccb577f6d0be0244a174
|
3 |
+
size 262144000
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cdb9a8a914bda770991788d43bd7a9d146703b07551fd87a20b3e94ae175094
|
3 |
+
size 524288000
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6766a57568c9012969bb9916745e123c8293bbc73214a1dacea91f851911de2
|
3 |
+
size 104857600
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e7987c61933273166ecc99b7ed18d0db310c7191b8a0db57d71dfd384a1a23d
|
3 |
+
size 83886080
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab8026a14f4bc856dda90f75568fdeaaf54aff6566d26780bd9ffab76c522632
|
3 |
+
size 262144000
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59f7a7402878d31d3b217a95588baf4d750c2dc3ecc0f91a80a567c22c746e97
|
3 |
+
size 262144000
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8917f7054ca6d86a2aab36286b7dcc62f7bb26ae7efe1333e6258e82b184934a
|
3 |
+
size 524288000
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d7b581d0a69a06a65a1bad632fe0a434751df610ff1d076fd61ad3ecb933884
|
3 |
+
size 104857600
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f727b0c02c96f8b986c8764510b250f84500687f0d3e9b50909737787898a8d
|
3 |
+
size 83886080
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abb9ac83959b1070d9abfd60aa929dc19bf4cc6715e96877f324a14e16fc2774
|
3 |
+
size 262144000
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe62285200b6ed9085fcaa15a9f64d7b9d52afa2f0abf1e23ee74227bcd462b7
|
3 |
+
size 524288000
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a4cc718fa420d0dae946fe276d072d8bb261d49a53ccd34b7db6be308eac2e9
|
3 |
+
size 104857600
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4c69850c32b0f3839d88b3a37ceebb520e4a54f7a7fded851ddbf92dd357e4c
|
3 |
+
size 83886080
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7623235557a5ec80468626f41886132bb865502e5b333276cd40b2555bb7f54e
|
3 |
+
size 524288000
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2a054023f45e9a40fc20ad4f83523224f75be929d97df9515c66a09759a0e51
|
3 |
+
size 104857600
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246b9faf6b56699e4100d196ed3f9e59f01aa694920c9f21937231a7c9abb002
|
3 |
+
size 524288000
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aee541244423ad497c71ab8a14ab71c13a1837461b6eb6e0127c71a9109e2c4
|
3 |
+
size 83886080
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f44651d8d4d5f9364e953f9653ec1177a076c4f4aac7b6ecc80f51efa71ac1e
|
3 |
+
size 262144000
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4939558abf626df74dbe11b0483106c4d80bfac1126c6e05edddcc5b4d57d59c
|
3 |
+
size 262144000
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3005666d218e9da0b2fc7b390371d7b0a79f23461ec71f9df5b756710f2a63
|
3 |
+
size 524288000
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db9b68e2e88fc6eaa8639247fbc1a5db4971d88fc6b464b4edf38ad5d274eaea
|
3 |
+
size 104857600
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a533e8b2a29f9c9bdec09bde02144690363e96755b08e1c84dacb37a778858f2
|
3 |
+
size 83886080
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293b18ebb8f8d38498c4e995e9de352ca83cf4a3420493e3aa3c63b7d2309ed1
|
3 |
+
size 262144000
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c9a6d6bdfb0d858b1976eb17e29e2ea757361d60a04d994d1e2ac8dddc90d4a
|
3 |
+
size 524288000
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:839289b434d4ce3ddaf562357a4913486fcf345b62f4a3eac84fcf12a3a75ea1
|
3 |
+
size 104857600
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96e17e29797a3be904c0e83641afede7c87c80333609052636054ad4c7d6bf82
|
3 |
+
size 83886080
|