riczhou committed on
Commit
ca69851
·
verified ·
1 Parent(s): a0f1f6f

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 2560,
8
+ "intermediate_size": 9728,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 32,
11
+ "num_hidden_layers": 36,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": true,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:803a03d6c71151203b15959a5506046b3ac94a370da440dae2e380b3c67d5645
3
+ size 194478080
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab29357fd1a7a08948b9a5cc2fc6a6c483078383a5c675e53402a1bc75f0c3bb
3
+ size 24314880
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:544301b2dea40e94338995f604cf059a78fa338da0cd8b5e8ae35e496e7812ef
3
+ size 24903680
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50df64a7abbcfef5d4c52137a6fd0fd52598941ffb40d1c964c68a52bb5602d3
3
+ size 31877632
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd92bdc41f40a70fbe20827ef0390abb2f082b96b59769d24f5b0e4f479e2aa2
3
+ size 24903680
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1967eba269fb57cedc7a1d5e1c1719dcb853b6d9e937b2d2a726db36d74fe5ac
3
+ size 31877632
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae9003edbedfc127d122ac614c9774e5db588ebafff83198f44f6d1317576bd1
3
+ size 24903680
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9a2ca0f074ce9af2bff0f47845d9ecadc9b998c221fe50c41326c1203110dc
3
+ size 24903680
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5e34658091b217b87a47e393826ed950f3a77f438c07d759228f7c50636267e
3
+ size 31872512
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e763adb7d587c736c4fba728ae52656fcabf5da37b941463f9256af8f1deee0
3
+ size 24903680
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40d6a8bebf90be94cf20d0edd77cd80d5dd79ed8690762c18500663ed91bcc92
3
+ size 31872512
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:835f56d49ed780c7fdeba0f0312497db08e22eb7cfc048ed24152feb26a846c4
3
+ size 24903680
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f157e350cea6dadbd906a6a9998ab017e3a1fe07fa4dccbb2cfc9be68c8b94a2
3
+ size 24903680
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7ac3c013c4cdae40884b0760225b98360f9ba6331348bb80a1e91c4521cc96a
3
+ size 31877632
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc6e145d70b226e645341649d975bba83ea886522cfcb79cbb6b9d1775369359
3
+ size 24903680
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c26dd7beb3197ad95cb6532e0a344caae17a4bf2469b1e4de4e7db0e19e51eb3
3
+ size 31877632
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cfa09e2a9c31efda9e94ad822d6dd357f3b00c56ae0be0e55ea196594b8c69f
3
+ size 24903680
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e6f361abdda778736066a8e94ac2cf288b4d90eb3961a08a466dad4e306cba1
3
+ size 31877632
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203b74b0c96d2b974bdc46c2afae74cf1a330f7dcfd45f3bf9b938c4f7791ff5
3
+ size 24903680
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86e8a1da3075d0d755693b131e24222e3bd351ebb005b389b9ec1bf9c169a1f4
3
+ size 31877632
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff7920bf6be06898c7982ddaf8b7b36e7d3b3f114edc05c21d2f9ff7b45565d
3
+ size 24903680
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e47a91e8b997ff97098ac87a115c974a4f82c27b5d736acf5ef03823d3370b0
3
+ size 31877632
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0c343468adaf8fb0bd4615ad7a9f0e341d21a5ee66c508e17af2d70564e69b3
3
+ size 24903680
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9c78e7553e394a112c28258ceb549788c5647d711a2977660af887e1cab8d1
3
+ size 31877632
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:536bb8efda07245f4f39f773c7db73451e6924799816ddfd6c8a9707f93ac337
3
+ size 31877632
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:289794ad588e5004b4b1b420fcc90562d3022fc482608387d325171d4640ac36
3
+ size 24903680
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b1387dcf12afc448131de3a0f6fe16cd424e7f56786476720ca9a1e5a152b9
3
+ size 31877632
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dced4e001d7046ad2d4cbc8e9795b0bb8ce96cb8d4f2d7cccdc63723405820e
3
+ size 31887872
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49179c6bbc80085ea6119e0c96476fdc370827ca5ad01a4e1ceefd71e34ba98d
3
+ size 24903680
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ecb4fe43f9ba991ffa4b9825103677417d83d5b88862f81b0cf0c6bbc4e06b
3
+ size 31877632
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23e6e002218f09169af86a9fb53ddc0f1ce9100d685952eb33a451f455426402
3
+ size 24903680
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd84e6cc916a7bda901f16b3b2681b0e61918463315fd84e5e62d3fb66e5bccb
3
+ size 31877632
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41d371d30b4dd54b98b99a4d86a056148538836ac1b675ad93f08b3d042769ff
3
+ size 24903680
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:409e9eccda5b35d9eb9e2fb2d9c35ea80a3c706b24f28eac6df065cffe2dd4d9
3
+ size 31877632
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4ac50f8f25e8b16074a72c43f68d38e147ef37a97cb6c841af7685ff4ad1b10
3
+ size 24903680
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5997da5af30262adce068841441151d90ca3b79f1de85739f1392dcc4c50a1cf
3
+ size 24903680
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31ab38a4084130913d027fc43604dae71b87fa96069845125da32e929f1d7d8
3
+ size 31877632
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49ae6ca93bf47ce1260999e0ff765ddc5b3ced5b2ae877e415a8e190293bf18
3
+ size 24903680
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c048ccc934fbd733c95863974dd8d2db59c8dc9a0e5b2536a94eb5bb7eaa05c
3
+ size 31877632
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bd73c9fb17b481337353a1ff85f3cb332454b746e75dc5bd1489c483de8a34b
3
+ size 24903680
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3300e8610c344ca0c0d11c0474bcbdb555c38269a0ce70ca729d9bd23e87403
3
+ size 31877632
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfc611af1ac71fc371816891382ce896c82cb6f31e285254541e4e59d33d2f5b
3
+ size 24903680
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:226854995e3aa336ea43f274546f03af6e7b5d5c91e153efa77090822ec40463
3
+ size 31877632
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b64d91e41d0b1d5de008e36be3c5d9610e43ec5cef02906257bf73d9a124e88
3
+ size 24903680
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c31857fc861f3ac7e5987edac1233489744e4926c14b7eb9ef553e2d6cf15504
3
+ size 31877632