Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +3 -0
- mlc-chat-config.json +99 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image_soft_token>": 262144
|
3 |
+
}
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma3",
|
4 |
+
"quantization": "q0f32",
|
5 |
+
"model_config": {
|
6 |
+
"text_config": {
|
7 |
+
"hidden_size": 2560,
|
8 |
+
"intermediate_size": 10240,
|
9 |
+
"num_hidden_layers": 34,
|
10 |
+
"attention_bias": false,
|
11 |
+
"num_attention_heads": 8,
|
12 |
+
"num_key_value_heads": 4,
|
13 |
+
"head_dim": 256,
|
14 |
+
"rms_norm_eps": 1e-06,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000,
|
17 |
+
"context_window_size": 8192,
|
18 |
+
"prefill_chunk_size": 8192,
|
19 |
+
"query_pre_attn_scalar": 256,
|
20 |
+
"sliding_window": 1024,
|
21 |
+
"kwargs": {
|
22 |
+
"model_type": "gemma3_text",
|
23 |
+
"rope_scaling": {
|
24 |
+
"factor": 8.0,
|
25 |
+
"rope_type": "linear"
|
26 |
+
}
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"vocab_size": 262208,
|
30 |
+
"tensor_parallel_shards": 1,
|
31 |
+
"max_batch_size": 128,
|
32 |
+
"context_window_size": 8192,
|
33 |
+
"sliding_window_size": -1,
|
34 |
+
"prefill_chunk_size": 8192,
|
35 |
+
"is_text_model": false
|
36 |
+
},
|
37 |
+
"vocab_size": 262208,
|
38 |
+
"context_window_size": 8192,
|
39 |
+
"sliding_window_size": -1,
|
40 |
+
"prefill_chunk_size": 8192,
|
41 |
+
"attention_sink_size": -1,
|
42 |
+
"tensor_parallel_shards": 1,
|
43 |
+
"pipeline_parallel_stages": 1,
|
44 |
+
"temperature": 1.0,
|
45 |
+
"presence_penalty": 0.0,
|
46 |
+
"frequency_penalty": 0.0,
|
47 |
+
"repetition_penalty": 1.0,
|
48 |
+
"top_p": 0.95,
|
49 |
+
"tokenizer_files": [
|
50 |
+
"tokenizer.model",
|
51 |
+
"tokenizer.json",
|
52 |
+
"added_tokens.json",
|
53 |
+
"tokenizer_config.json"
|
54 |
+
],
|
55 |
+
"tokenizer_info": {
|
56 |
+
"token_postproc_method": "byte_fallback",
|
57 |
+
"prepend_space_in_encode": false,
|
58 |
+
"strip_space_in_decode": false
|
59 |
+
},
|
60 |
+
"conv_template": {
|
61 |
+
"name": "gemma_instruction",
|
62 |
+
"system_template": "{system_message}",
|
63 |
+
"system_message": "",
|
64 |
+
"system_prefix_token_ids": [
|
65 |
+
2
|
66 |
+
],
|
67 |
+
"add_role_after_system_message": true,
|
68 |
+
"roles": {
|
69 |
+
"user": "<start_of_turn>user",
|
70 |
+
"assistant": "<start_of_turn>model"
|
71 |
+
},
|
72 |
+
"role_templates": {
|
73 |
+
"user": "{user_message}",
|
74 |
+
"assistant": "{assistant_message}",
|
75 |
+
"tool": "{tool_message}"
|
76 |
+
},
|
77 |
+
"messages": [],
|
78 |
+
"seps": [
|
79 |
+
"<end_of_turn>\n"
|
80 |
+
],
|
81 |
+
"role_content_sep": "\n",
|
82 |
+
"role_empty_sep": "\n",
|
83 |
+
"stop_str": [
|
84 |
+
"<end_of_turn>"
|
85 |
+
],
|
86 |
+
"stop_token_ids": [
|
87 |
+
1,
|
88 |
+
106
|
89 |
+
],
|
90 |
+
"function_string": "",
|
91 |
+
"use_function_calling": false
|
92 |
+
},
|
93 |
+
"pad_token_id": 0,
|
94 |
+
"bos_token_id": 2,
|
95 |
+
"eos_token_id": [
|
96 |
+
1,
|
97 |
+
106
|
98 |
+
]
|
99 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84a56ee03e66003602b56de104e739e89bac4cdb374237ba90ae88813badfe65
|
3 |
+
size 1342504960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5499f2f069f5ac1bc309d802d3f75191cf7da41d7489a57790e4720abbbb897
|
3 |
+
size 52428800
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78fd168e73131a0aa5058faff5d23034bd44888a3beab6fecce5cbd3b677b868
|
3 |
+
size 104857600
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1659b99d8ae756e27c4f7cc0f169f98e35a245fa29b481352a6591f580586ab4
|
3 |
+
size 104857600
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93a48a48318e5dd33926858e73d6927f5bf4e223a2f9b55c8d5f1839814aba05
|
3 |
+
size 31478784
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a024fc6e5e60783b5d1732c047e86d722bee1ecb4803856942351ab9b457f177
|
3 |
+
size 31462912
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beba06e746ffc6461be1fd2b0f43b28d076cac39b2d93dc7b7d7e6e02b1360e1
|
3 |
+
size 31478784
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d351ebdabffc75fa649799626527797955c44a86840c26a5037dc01cad4be0a
|
3 |
+
size 52428800
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14a9082bc21960f26c73e9ce50f41dd05b6b20bf4483ff1840c87111ed22b2dd
|
3 |
+
size 104857600
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ceec63edbdf04ea2cd6ba13f54dc3fe3c947c9f1b1d535d9a4f81582da5f61
|
3 |
+
size 31478784
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4059691746ffb982f18e33ce2578555b7d78f8775b92ef44d63552296f575532
|
3 |
+
size 52428800
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6d4f0d24a95d0e362800ecd2284d3eb7212d861d59063e3710831037325e366
|
3 |
+
size 104857600
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c31883ae81e12d5b2862766ba7e7800d7a8690fcb1e0b415bf0fa626d827ead
|
3 |
+
size 31478784
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0240f4e97e039ee7e12b829469a4fd13e10499361a08a3e684632f77243cf84
|
3 |
+
size 104857600
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8a69a9f98f599e0f4d4f3af48600a7d205a7bca52ee09322516f21f68b80895
|
3 |
+
size 31458304
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77398a98fb6eb98b0ed846569bd8b177d34de39782037c2bc30b5d434577bd8e
|
3 |
+
size 104857600
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6bd63745f609aa0cf3d12ca6243126e0cb59de0a8646d683da61809c4c9f842
|
3 |
+
size 52428800
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86e0718b1e918639bdc22bbaf24c47250a36608977c1539c3e7aab9ff090d575
|
3 |
+
size 104857600
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9bbc1d443760d351fc9cda315881f1cd53e319f42733f8f5e14c7b319e055b
|
3 |
+
size 31478784
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d3ad676c2a21d5239c82ded6043d71f34070b5fdc4ac60c6e1171a80871b833
|
3 |
+
size 52428800
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcbe354a64e850285ce576874366c82efa76f3c4ada2631a408d40e24a8b18a2
|
3 |
+
size 104857600
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14b3c4aa0845185f3dfb83878a5f8b957f9668513c85347d031f0ebb90e496c9
|
3 |
+
size 31478784
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b0cd43a7357dd7e96f42ffbc071aaaaf2317cafde215056f735e3ccf1eb2c1
|
3 |
+
size 52428800
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffffa8d399f5775c01adb129de6e41a1bf0ef68c257b607edd86f1b5ba08c285
|
3 |
+
size 104857600
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1277e7a57a8218af5b88c46fe0650f705d71f5986dc61ca82655271acdf25b5e
|
3 |
+
size 31478784
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b55d286e860b0b4509141f756d7ee437b686b75e94191bebbcb2e9df28ac951
|
3 |
+
size 52428800
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17db69942cf24030261ecedfcc1fc474a313efeb03d559845e0941a4904f7d15
|
3 |
+
size 52428800
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c33ef84460d3d0589efcc3bdb9629679b32ceae102d33d34baabc36059f0e776
|
3 |
+
size 104857600
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7b08acebbc0c7e2b59b9e8ff99d6fe38ce2e8348947046cee042eaa2bb6a49d
|
3 |
+
size 31478784
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a6d4a265fb6215b0eaf2b45202c84945fbecd629de788c290865af03fc19a22
|
3 |
+
size 52428800
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f18017a281549c02b9546e464ec5acd94fef939cf7afe10f35701bded32d2b34
|
3 |
+
size 104857600
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f41319516ca266b2a70106a5d33ab8c28d39596b72638a4de7e8c4c13d6d7a3
|
3 |
+
size 31478784
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee453c416826c7ffcc9c2bdb0278bfd194f60e91b215882923f7638058af6ea4
|
3 |
+
size 52428800
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:300d77dd3a0aa4c1c5fa0049776b033cde62536277dea84989d8a6eb56ed9ca5
|
3 |
+
size 104857600
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b5157d7a45462009abfe5453d38bebb339ce988e810404ae4c6e4f9b900273f
|
3 |
+
size 31478784
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab990b235f9fb46615928c08edc689c12d35bd2f42670455af5cddcc6d4949e
|
3 |
+
size 52428800
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9672cb2e0dc426db767d84307291dd0c6b969f13dc2d188348436a5b3c3b172
|
3 |
+
size 104857600
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f0fc6e422dcb0a582dd42fa458d3c829fb67cae4ac79018f8db1a3f657ad84a
|
3 |
+
size 104857600
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1b5d241df0e1eb168fb1d19aa274c8b953e5f49469dbb3901cae6f9c19115bf
|
3 |
+
size 31478784
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22c66e1e132a61e2fccb31835e29201d7dde5bc38a801f6af79b57d678a22334
|
3 |
+
size 52428800
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eba5cfb4b676bb151b41d8664072741efd7bac184cd927c842df5a112872af4a
|
3 |
+
size 104857600
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5550a9f4373edd6bdf1a0c5f32aa1fbc632babde0e6869f8f72d9747c63e2636
|
3 |
+
size 31478784
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef548ea20a22548956f39e2c26c7d99c684a336a27c6dd3799a33dbc20234ee2
|
3 |
+
size 52428800
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d4e3f7f95b6513f289409cb3a1c826328c5195f404f973a335e2b5a247e4085
|
3 |
+
size 52428800
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6965b5250c6433c364b47a21d77b30afe5371ee4cccd7c0e9a3a1f8716dddd4f
|
3 |
+
size 104857600
|