riczhou committed on
Commit
e013b5e
·
verified ·
1 Parent(s): 5cf8a10

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3",
4
+ "quantization": "q0f32",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 2560,
8
+ "intermediate_size": 10240,
9
+ "num_hidden_layers": 34,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 8,
12
+ "num_key_value_heads": 4,
13
+ "head_dim": 256,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 256,
20
+ "sliding_window": 1024,
21
+ "kwargs": {
22
+ "model_type": "gemma3_text",
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "rope_type": "linear"
26
+ }
27
+ }
28
+ },
29
+ "vocab_size": 262208,
30
+ "tensor_parallel_shards": 1,
31
+ "max_batch_size": 128,
32
+ "context_window_size": 8192,
33
+ "sliding_window_size": -1,
34
+ "prefill_chunk_size": 8192,
35
+ "is_text_model": false
36
+ },
37
+ "vocab_size": 262208,
38
+ "context_window_size": 8192,
39
+ "sliding_window_size": -1,
40
+ "prefill_chunk_size": 8192,
41
+ "attention_sink_size": -1,
42
+ "tensor_parallel_shards": 1,
43
+ "pipeline_parallel_stages": 1,
44
+ "temperature": 1.0,
45
+ "presence_penalty": 0.0,
46
+ "frequency_penalty": 0.0,
47
+ "repetition_penalty": 1.0,
48
+ "top_p": 0.95,
49
+ "tokenizer_files": [
50
+ "tokenizer.model",
51
+ "tokenizer.json",
52
+ "added_tokens.json",
53
+ "tokenizer_config.json"
54
+ ],
55
+ "tokenizer_info": {
56
+ "token_postproc_method": "byte_fallback",
57
+ "prepend_space_in_encode": false,
58
+ "strip_space_in_decode": false
59
+ },
60
+ "conv_template": {
61
+ "name": "gemma_instruction",
62
+ "system_template": "{system_message}",
63
+ "system_message": "",
64
+ "system_prefix_token_ids": [
65
+ 2
66
+ ],
67
+ "add_role_after_system_message": true,
68
+ "roles": {
69
+ "user": "<start_of_turn>user",
70
+ "assistant": "<start_of_turn>model"
71
+ },
72
+ "role_templates": {
73
+ "user": "{user_message}",
74
+ "assistant": "{assistant_message}",
75
+ "tool": "{tool_message}"
76
+ },
77
+ "messages": [],
78
+ "seps": [
79
+ "<end_of_turn>\n"
80
+ ],
81
+ "role_content_sep": "\n",
82
+ "role_empty_sep": "\n",
83
+ "stop_str": [
84
+ "<end_of_turn>"
85
+ ],
86
+ "stop_token_ids": [
87
+ 1,
88
+ 106
89
+ ],
90
+ "function_string": "",
91
+ "use_function_calling": false
92
+ },
93
+ "pad_token_id": 0,
94
+ "bos_token_id": 2,
95
+ "eos_token_id": [
96
+ 1,
97
+ 106
98
+ ]
99
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84a56ee03e66003602b56de104e739e89bac4cdb374237ba90ae88813badfe65
3
+ size 1342504960
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5499f2f069f5ac1bc309d802d3f75191cf7da41d7489a57790e4720abbbb897
3
+ size 52428800
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78fd168e73131a0aa5058faff5d23034bd44888a3beab6fecce5cbd3b677b868
3
+ size 104857600
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1659b99d8ae756e27c4f7cc0f169f98e35a245fa29b481352a6591f580586ab4
3
+ size 104857600
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a48a48318e5dd33926858e73d6927f5bf4e223a2f9b55c8d5f1839814aba05
3
+ size 31478784
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a024fc6e5e60783b5d1732c047e86d722bee1ecb4803856942351ab9b457f177
3
+ size 31462912
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beba06e746ffc6461be1fd2b0f43b28d076cac39b2d93dc7b7d7e6e02b1360e1
3
+ size 31478784
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d351ebdabffc75fa649799626527797955c44a86840c26a5037dc01cad4be0a
3
+ size 52428800
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a9082bc21960f26c73e9ce50f41dd05b6b20bf4483ff1840c87111ed22b2dd
3
+ size 104857600
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ceec63edbdf04ea2cd6ba13f54dc3fe3c947c9f1b1d535d9a4f81582da5f61
3
+ size 31478784
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4059691746ffb982f18e33ce2578555b7d78f8775b92ef44d63552296f575532
3
+ size 52428800
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6d4f0d24a95d0e362800ecd2284d3eb7212d861d59063e3710831037325e366
3
+ size 104857600
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c31883ae81e12d5b2862766ba7e7800d7a8690fcb1e0b415bf0fa626d827ead
3
+ size 31478784
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0240f4e97e039ee7e12b829469a4fd13e10499361a08a3e684632f77243cf84
3
+ size 104857600
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8a69a9f98f599e0f4d4f3af48600a7d205a7bca52ee09322516f21f68b80895
3
+ size 31458304
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77398a98fb6eb98b0ed846569bd8b177d34de39782037c2bc30b5d434577bd8e
3
+ size 104857600
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6bd63745f609aa0cf3d12ca6243126e0cb59de0a8646d683da61809c4c9f842
3
+ size 52428800
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86e0718b1e918639bdc22bbaf24c47250a36608977c1539c3e7aab9ff090d575
3
+ size 104857600
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d9bbc1d443760d351fc9cda315881f1cd53e319f42733f8f5e14c7b319e055b
3
+ size 31478784
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d3ad676c2a21d5239c82ded6043d71f34070b5fdc4ac60c6e1171a80871b833
3
+ size 52428800
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcbe354a64e850285ce576874366c82efa76f3c4ada2631a408d40e24a8b18a2
3
+ size 104857600
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14b3c4aa0845185f3dfb83878a5f8b957f9668513c85347d031f0ebb90e496c9
3
+ size 31478784
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b0cd43a7357dd7e96f42ffbc071aaaaf2317cafde215056f735e3ccf1eb2c1
3
+ size 52428800
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffffa8d399f5775c01adb129de6e41a1bf0ef68c257b607edd86f1b5ba08c285
3
+ size 104857600
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1277e7a57a8218af5b88c46fe0650f705d71f5986dc61ca82655271acdf25b5e
3
+ size 31478784
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b55d286e860b0b4509141f756d7ee437b686b75e94191bebbcb2e9df28ac951
3
+ size 52428800
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17db69942cf24030261ecedfcc1fc474a313efeb03d559845e0941a4904f7d15
3
+ size 52428800
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c33ef84460d3d0589efcc3bdb9629679b32ceae102d33d34baabc36059f0e776
3
+ size 104857600
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7b08acebbc0c7e2b59b9e8ff99d6fe38ce2e8348947046cee042eaa2bb6a49d
3
+ size 31478784
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a6d4a265fb6215b0eaf2b45202c84945fbecd629de788c290865af03fc19a22
3
+ size 52428800
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f18017a281549c02b9546e464ec5acd94fef939cf7afe10f35701bded32d2b34
3
+ size 104857600
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f41319516ca266b2a70106a5d33ab8c28d39596b72638a4de7e8c4c13d6d7a3
3
+ size 31478784
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee453c416826c7ffcc9c2bdb0278bfd194f60e91b215882923f7638058af6ea4
3
+ size 52428800
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:300d77dd3a0aa4c1c5fa0049776b033cde62536277dea84989d8a6eb56ed9ca5
3
+ size 104857600
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5157d7a45462009abfe5453d38bebb339ce988e810404ae4c6e4f9b900273f
3
+ size 31478784
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab990b235f9fb46615928c08edc689c12d35bd2f42670455af5cddcc6d4949e
3
+ size 52428800
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9672cb2e0dc426db767d84307291dd0c6b969f13dc2d188348436a5b3c3b172
3
+ size 104857600
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f0fc6e422dcb0a582dd42fa458d3c829fb67cae4ac79018f8db1a3f657ad84a
3
+ size 104857600
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b5d241df0e1eb168fb1d19aa274c8b953e5f49469dbb3901cae6f9c19115bf
3
+ size 31478784
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22c66e1e132a61e2fccb31835e29201d7dde5bc38a801f6af79b57d678a22334
3
+ size 52428800
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eba5cfb4b676bb151b41d8664072741efd7bac184cd927c842df5a112872af4a
3
+ size 104857600
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5550a9f4373edd6bdf1a0c5f32aa1fbc632babde0e6869f8f72d9747c63e2636
3
+ size 31478784
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef548ea20a22548956f39e2c26c7d99c684a336a27c6dd3799a33dbc20234ee2
3
+ size 52428800
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d4e3f7f95b6513f289409cb3a1c826328c5195f404f973a335e2b5a247e4085
3
+ size 52428800
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6965b5250c6433c364b47a21d77b30afe5371ee4cccd7c0e9a3a1f8716dddd4f
3
+ size 104857600