Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- merges.txt +0 -0
- mlc-chat-config.json +85 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen3",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 2048,
|
8 |
+
"intermediate_size": 6144,
|
9 |
+
"attention_bias": false,
|
10 |
+
"num_attention_heads": 16,
|
11 |
+
"num_hidden_layers": 28,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"rope_theta": 1000000,
|
15 |
+
"vocab_size": 151936,
|
16 |
+
"tie_word_embeddings": true,
|
17 |
+
"context_window_size": 40960,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"head_dim": 128,
|
21 |
+
"dtype": "float32",
|
22 |
+
"max_batch_size": 128
|
23 |
+
},
|
24 |
+
"vocab_size": 151936,
|
25 |
+
"context_window_size": 40960,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 0.6,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 0.95,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"vocab.json",
|
39 |
+
"merges.txt",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_level",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "qwen2",
|
49 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
50 |
+
"system_message": "You are a helpful assistant.",
|
51 |
+
"system_prefix_token_ids": null,
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "<|im_start|>user",
|
55 |
+
"assistant": "<|im_start|>assistant"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"<|im_end|>\n"
|
65 |
+
],
|
66 |
+
"role_content_sep": "\n",
|
67 |
+
"role_empty_sep": "\n",
|
68 |
+
"stop_str": [
|
69 |
+
"<|endoftext|>",
|
70 |
+
"<|im_end|>"
|
71 |
+
],
|
72 |
+
"stop_token_ids": [
|
73 |
+
151643,
|
74 |
+
151645
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 151643,
|
80 |
+
"bos_token_id": 151643,
|
81 |
+
"eos_token_id": [
|
82 |
+
151645,
|
83 |
+
151643
|
84 |
+
]
|
85 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bccd2bc5ec321a16d2c273d27634c9fe272fa5814fecc1fa48790fe7793edead
|
3 |
+
size 622329856
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65efed6e9ddaa313b65e46cbaca9a30c6cc92fff540aca242e9ce6355ea6442a
|
3 |
+
size 50331648
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acbcf53efa5e28e42d6cf4d86b5262b84958472c3d03f04fa86e1f734501d6ae
|
3 |
+
size 25165824
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:195e08f6b79eb245bb40737ad64c4307f38af4701aec86303559e0b1be0099fb
|
3 |
+
size 50331648
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:795c01871a3c1f85e66a65fd776ab58f105ae9558ddd8d83072eabc9ab390068
|
3 |
+
size 25174528
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f2dd95d5b572b4d529b5b3f54351ecc272372799257000994d27163dd1d3a27
|
3 |
+
size 25165824
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:652f98beaf5bdc0cebc4b01d9b8b9482dcff085c997deef6fbba8376e5bb462f
|
3 |
+
size 50331648
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:565595b3edf3cc998c821e3797e99c4b4a049e8029d069b482a3074e6c23ad95
|
3 |
+
size 25174528
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:897b5b8536aa504017faff569ec0605b8d4e0cba8eed1a2a677a91ad1f818bbc
|
3 |
+
size 25165824
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dc148b6c7632880db2e2bf07bf9236e4abf44d688226cce33c1db928b295d21
|
3 |
+
size 50331648
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a627302490d41d11609bf63f219a549a38febca610201dab61f04fb3b8a6f0f6
|
3 |
+
size 25174528
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34b7cb3fa5893336b833da3bc547d75647c40073219178d0fd0eeb85d475347e
|
3 |
+
size 25165824
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa24455302c97e36bb574ded6d7bbb3190f2211bca677e5f814cea5378d1e198
|
3 |
+
size 16777216
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fe15ecf104cb110cf84c2e17865171c5a2a3a6e97680ef27a54590548a9202d
|
3 |
+
size 50331648
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73530d66d913525b40dc8ad698e43d88d224f5718cb8d50d6785812220c8fa84
|
3 |
+
size 25174528
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3da55fe516b8e25d239670cfc8b87f3d1ab8435790793238f86ce21665afbe1
|
3 |
+
size 25165824
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a52f5228a50e05979b882458ba5fe81d17b83f7f9d3c7a3920caaa437c0a31f5
|
3 |
+
size 50331648
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f193651617e672da5ade3dfe877558e39a44d08b2a8ab31a6742612486915ba
|
3 |
+
size 25174528
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97edd3137a13011115e59ae39b1a9e423f73aee6146ad2beba389e103905c6b5
|
3 |
+
size 25165824
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:423992cb3188bdd7638e22d0a99d576d213ce5f79ada2e71bd0fcbbe8b4198bb
|
3 |
+
size 50331648
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9de327dd6ff652795bfcebfe18a1c7541141da46d2cbed366420c82fa9221a7e
|
3 |
+
size 25174528
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b09dc9101687a577642e4a7e23f71cc575ce16860fe7962b4a31a458efb3dca
|
3 |
+
size 25165824
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df7b6fab8f4c3c49e1fd95a6a87bf6100d1c2a862ebd9df7239fa5f7d3c51e7d
|
3 |
+
size 50331648
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0563d92a1d3ab9a92fe628f53f38e6643b8062616cbc1620b99ceab9b04b0f6
|
3 |
+
size 25174272
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73fff44777334aa00a6230833dc907e8e761a9ba375bf76ab27f343ea1f0abad
|
3 |
+
size 25174528
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44ed3fa27db73dd913d6e47dd705416af76a30d15bafd948043f8fb472c2dfec
|
3 |
+
size 25165824
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f6aef49936e3b0e051227c86e8710d67b8d434b4e0a8e3e81e110739811fec8
|
3 |
+
size 50331648
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d10bd85efe7ab2d0b5892184349197862d480e836ca5c2a03c4356aa32f09bda
|
3 |
+
size 25174528
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d9e46c5831e4eb448bc61c86317a170b894d23473168412f91fc8a15b21ab6f
|
3 |
+
size 25165824
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb5146f5eb37e758c752e2778b05e065730237085bd29bd16e17ea3e3572509d
|
3 |
+
size 50331648
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb45a454dfbff8281d49e5992dfc6686c030877626c0ecb372307f48289d7d8
|
3 |
+
size 25174528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a73e177cece4a4780445389b14756f8396a7112435278988902b5e06e27a4fd
|
3 |
+
size 25165824
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4020e929ea57d4cfefad771163243b91f470dae281549d1cf063df9019d39914
|
3 |
+
size 50331648
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eed11ddb5fe48f9c32f05133b38fd9e25407f3a166e19561fa398414f90789a4
|
3 |
+
size 25174528
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8e4479d59e7a91676634a0a355ed2921750288da45f1a75d8f3f928498c3bc9
|
3 |
+
size 25165824
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd04a54267b103becb94cb0c3903c54346b9a78e860a053339d19579009aca95
|
3 |
+
size 25165824
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9594a633237f32e853a55dc53a4d9cc51f3c7be7e001a295ef435492cc73b530
|
3 |
+
size 50331648
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ae42f6f59943dfd17717937ae77c3bdd4d0fb6eefadfee90b29fb5202903e16
|
3 |
+
size 25174528
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa540a0108bcec1f225bb660825e013490d60d1fb98f5b7fa1a1403720b843cc
|
3 |
+
size 25165824
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1867ba9a3acf0f8eba1dbf0a5e2d159d05cb72d3d7be0162cf64da71b60096c4
|
3 |
+
size 50331648
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95b8d82edd59444f991efc3bd9b01b15d69053e96536c1f78dfea881f47f4559
|
3 |
+
size 25174528
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22e574b8dc77061adbf4690b329a1728cf33c85a5e75eef7ec2c4e8ff6dd71d0
|
3 |
+
size 25165824
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12d5a6249f06c1c9f5726ea99ecfa0c17c0455a2313c2ef6138c6f67c21409ad
|
3 |
+
size 50331648
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:923bc1b55f4ea28cfb6f3800b5a871ef806dde054e11678a2f3ccde69ef22402
|
3 |
+
size 25174528
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:573c6820d78f920aee4d84a0f8fde84ca766912685ee84a2d30e3033f583d628
|
3 |
+
size 25165824
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13efe9f59b446d23ed4b9f86cc86287507781bb8ae86704dfd067248b4054e1d
|
3 |
+
size 50331648
|