riczhou committed on
Commit
be3f138
·
verified ·
1 Parent(s): 27c9cee

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 25600,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 64,
11
+ "num_hidden_layers": 64,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0d0629283ca39aa7463b551128eb08b14852f063607bc52c22b34871e4a3b4
3
+ size 1555824640
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:961a81d70cb6cdf10115732263bccc29af3e4d5335e16c74af445977056eddc8
3
+ size 262144000
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266cf172f350d07d89afa4d98187a5dc127a95efaf69fec624596983eb8bd883
3
+ size 104857600
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f53479396d0e298216d3c07e3e9f4b6234b213d6c12bd579e012dd77b91c151d
3
+ size 262144000
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f84bfa74ea72e41c608d3170f2fa820ae3b69820bb30ea529d1375f91cbd3ed4
3
+ size 524288000
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38c7edd0acf171d48ff0bc330c77ad96945d52fa03734c2a2dbc309d09908107
3
+ size 104857600
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:134280a7af4f3272d0ba37eaf622dd9af992b469502b452adef4b73d9e501d5d
3
+ size 83886080
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:980e61027f2954b296e959527d3684bc82070c5124559eef937ac0562d47113f
3
+ size 262144000
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c4f6075069a990dc6488c5a06b39d744d9a034a442956c75e7e0e30c0df43af
3
+ size 524288000
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4119b37cf64511ebc5b6d78ade321fec4ec305f083f7b638d86aa70d937d7653
3
+ size 104857600
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5efa2cde859117f333f091fb56cf6c13fcf6ce80440df2566aab214f85ff9af9
3
+ size 83886080
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9b7532443a32c461ddaba886c7266327110251fcefcce92711ba1f4139a92cb
3
+ size 262144000
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46ecc56cf6207df463b57a92235f9bb40655fb06f8091e5c3a18e16c83216541
3
+ size 524288000
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:074fec20bd9ba0b8b843982ac3da1d0a1357b2058ec2076cc9bc0575471bb617
3
+ size 83886080
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cca4d75355300192166321747fc0b5753bd3fef9f725da6c9e123bc3b005303e
3
+ size 104857600
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8dcd515b8d9d4d824f550ab23f89ba3a835e9bcb7a16bc1be35bea522d7ac1f
3
+ size 83886080
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8abd0f853ba12714def448055d03a36bc76b9bd570c954cf6b92c65681bc813a
3
+ size 524288000
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00df036b775f50a48dae448d1f490ca1ca5f65e680c8795705ec29fbb5e7e079
3
+ size 104857600
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f67d4cbef8e444d9c4b4c52e8ccb02a07b01e8a429ab274d3cec40dc0eec95ae
3
+ size 83886080
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d42e32e116532200f66fd7ce7b796a2bd4261d97c85a13c2558040d5e743f29
3
+ size 262144000
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a9673e74ba2eed80de0c54eef8c0971191b448a8146ccb577f6d0be0244a174
3
+ size 262144000
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cdb9a8a914bda770991788d43bd7a9d146703b07551fd87a20b3e94ae175094
3
+ size 524288000
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6766a57568c9012969bb9916745e123c8293bbc73214a1dacea91f851911de2
3
+ size 104857600
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e7987c61933273166ecc99b7ed18d0db310c7191b8a0db57d71dfd384a1a23d
3
+ size 83886080
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab8026a14f4bc856dda90f75568fdeaaf54aff6566d26780bd9ffab76c522632
3
+ size 262144000
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f7a7402878d31d3b217a95588baf4d750c2dc3ecc0f91a80a567c22c746e97
3
+ size 262144000
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8917f7054ca6d86a2aab36286b7dcc62f7bb26ae7efe1333e6258e82b184934a
3
+ size 524288000
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d7b581d0a69a06a65a1bad632fe0a434751df610ff1d076fd61ad3ecb933884
3
+ size 104857600
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f727b0c02c96f8b986c8764510b250f84500687f0d3e9b50909737787898a8d
3
+ size 83886080
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abb9ac83959b1070d9abfd60aa929dc19bf4cc6715e96877f324a14e16fc2774
3
+ size 262144000
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe62285200b6ed9085fcaa15a9f64d7b9d52afa2f0abf1e23ee74227bcd462b7
3
+ size 524288000
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a4cc718fa420d0dae946fe276d072d8bb261d49a53ccd34b7db6be308eac2e9
3
+ size 104857600
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4c69850c32b0f3839d88b3a37ceebb520e4a54f7a7fded851ddbf92dd357e4c
3
+ size 83886080
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7623235557a5ec80468626f41886132bb865502e5b333276cd40b2555bb7f54e
3
+ size 524288000
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2a054023f45e9a40fc20ad4f83523224f75be929d97df9515c66a09759a0e51
3
+ size 104857600
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:246b9faf6b56699e4100d196ed3f9e59f01aa694920c9f21937231a7c9abb002
3
+ size 524288000
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aee541244423ad497c71ab8a14ab71c13a1837461b6eb6e0127c71a9109e2c4
3
+ size 83886080
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f44651d8d4d5f9364e953f9653ec1177a076c4f4aac7b6ecc80f51efa71ac1e
3
+ size 262144000
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4939558abf626df74dbe11b0483106c4d80bfac1126c6e05edddcc5b4d57d59c
3
+ size 262144000
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3005666d218e9da0b2fc7b390371d7b0a79f23461ec71f9df5b756710f2a63
3
+ size 524288000
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db9b68e2e88fc6eaa8639247fbc1a5db4971d88fc6b464b4edf38ad5d274eaea
3
+ size 104857600
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a533e8b2a29f9c9bdec09bde02144690363e96755b08e1c84dacb37a778858f2
3
+ size 83886080
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:293b18ebb8f8d38498c4e995e9de352ca83cf4a3420493e3aa3c63b7d2309ed1
3
+ size 262144000
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c9a6d6bdfb0d858b1976eb17e29e2ea757361d60a04d994d1e2ac8dddc90d4a
3
+ size 524288000
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:839289b434d4ce3ddaf562357a4913486fcf345b62f4a3eac84fcf12a3a75ea1
3
+ size 104857600
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e17e29797a3be904c0e83641afede7c87c80333609052636054ad4c7d6bf82
3
+ size 83886080