Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +42 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": true,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 49152,
|
12 |
+
"rotary_pct": 0.25,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 4096,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 4096,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 49152,
|
21 |
+
"context_window_size": 4096,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 4096,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"max_batch_size": 80,
|
27 |
+
"mean_gen_len": 128,
|
28 |
+
"max_gen_len": 512,
|
29 |
+
"shift_fill_factor": 0.3,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": "stablecode_instruct",
|
34 |
+
"pad_token_id": 0,
|
35 |
+
"bos_token_id": 0,
|
36 |
+
"eos_token_id": 0,
|
37 |
+
"tokenizer_files": [
|
38 |
+
"tokenizer.json",
|
39 |
+
"tokenizer_config.json"
|
40 |
+
],
|
41 |
+
"version": "0.1.0"
|
42 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f82892d0ba5f5309831d04362cb7f70576c2087e4a88b5883eb31c83135a2a2
|
3 |
+
size 62914560
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a89657456baf764ffbd7eea540b85c433d736cf77647149ce66ea1b7aea38866
|
3 |
+
size 22650880
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4971f8286636bdb75062d0c9172736c3e1beb05d0cc0581c4117ff421ebb816b
|
3 |
+
size 29537280
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:433662c03d7f3a46109c37b574c1d8008b10289df93cbc72391abb5cd952cb35
|
3 |
+
size 29537280
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e48121a6cb16e0ff050c73331b485d80e1ba6c61e4529a531c5d2360e2ff60d0
|
3 |
+
size 29532160
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf73e3ffca1becce4ddb20fc8e96647ec6ed3ccdfba64ed42f86d79d3f29c14c
|
3 |
+
size 29537280
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db0ac9306bf4f668a9dd7ee19f700c96123cc455f228cbd6fc91d1cdc63a7fd9
|
3 |
+
size 29537280
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3fbf9a5385a153cf3a0c38dda75bcfd7d475c9c0117c12b6a2d5bf43f30645
|
3 |
+
size 29532160
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09a39f311d4da0205517fa258e356901373a5bb42b60eafceda1dd6a871cc1ac
|
3 |
+
size 29537280
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d57ff73428e4cd70c8f490062cc4d1e2c08197fc1915e425411afb53b66639f
|
3 |
+
size 29537280
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7b5a00a94f0f3d040fecd66fcc0c20e63676bd4e85d38592866449ea82ecf11
|
3 |
+
size 29532160
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:757f5e904e6596f54aa42c29cbfe49ee4a998e1be9f61426f50055c6e8064b3a
|
3 |
+
size 29537280
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38755466489df3ebd51eb546ec74c2b65573ae88f2e3b7f14a33d66fa70008d9
|
3 |
+
size 29537280
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea730f3f2365d5333dcb94c71c1a23ccf5c6efde56885223f8c3f0cc7b7e4647
|
3 |
+
size 29537280
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f85be4d1a46604bc1151f7c61c6c43a7dbc7b7969224669ca0b4270988d3e7fb
|
3 |
+
size 29532160
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:192d121a46e33021117de119de50606aa378af175174578cf736dc5ebb440478
|
3 |
+
size 29537280
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dce76584bd9bc9dd1efe54005377c9c2384ff98438e71454e2245a67781eab2a
|
3 |
+
size 29537280
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbca9bdfbeef416249598f7c1195f68dd4e3c1200d85148c8dc117c96e325597
|
3 |
+
size 29532160
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a114f0a71de03dcff78a09f5e04eafb422d6248a61c9dc01a6a6ea977b0a158
|
3 |
+
size 29537280
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:148d706d0e2bd32f798a97f43182dddccb26b6d847b8e749cb5bb04866722a00
|
3 |
+
size 29537280
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e03222a79080f20a1aeb87d65a530568692d1a923a26038b82fb329e8dc2c74
|
3 |
+
size 29532160
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:707b77a32097c5ead806bd8e5a46cee067adc4f342d1507d9f8f3577be318cc3
|
3 |
+
size 29537280
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b73e853952299cb77da25c0d09f0afb5f5b392507c3655d76e66dc94668661a1
|
3 |
+
size 29537280
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d3e5a360667fe4bb4a4b81868510985265d8179fbec7ccd612ebf1eb4ca776d
|
3 |
+
size 29532160
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a02ec1ad3394476169c825b676649a5af40a28fd61997071806ed8d411481c9
|
3 |
+
size 29532160
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0eea8bf0d7b958552f65eda084fb98c0f9700e630e613784cba5db45f59c514
|
3 |
+
size 29537280
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c396c5f8a3cb898b7cfd8bd8501d69014e69e9075270e01cfe9416ebf0cd691
|
3 |
+
size 29537280
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15ec0aaa5f273351a7d9d62195f8f12d7ae5d9537a864dcd51d0abe98ff36553
|
3 |
+
size 29532160
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c4e7898049de58a46fe91dbd81cb81a9c00afb9dba17b4eee68e78ff917514b
|
3 |
+
size 29537280
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:089e12646c1791e105777c9226f2e28419f6b31802922572f020c6513b3b14de
|
3 |
+
size 29537280
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bf0d75772a7b64908ff7719defa3ec9cd820e43183bb47f3d30ec6b77a0862f
|
3 |
+
size 29532160
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919d1edaefe8b9350d433dedca3e9980d29f4fb16c6cbd912f90daa8e5bb1be9
|
3 |
+
size 29537280
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d20a959b5c7a718f9106331e07372922a3885a3287ebbc908310d57271cf7446
|
3 |
+
size 29537280
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9217c1bf0f1187d960210a841a180d1419bdaf8b7f05e9d92cb0f6116d401f2
|
3 |
+
size 29532160
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae935a2201fa254f408ee044b06fd4f2839394f35d3798150941dcd543069af8
|
3 |
+
size 29537280
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:275e29080b09e614536aa9ac069230567fca51863ad7d50aeceb447bbd81c505
|
3 |
+
size 29537280
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cab72eb28c699d7c2af22c390910cafc7abc6be4d2588a47196a58b7a3a09b8c
|
3 |
+
size 29537280
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe37cb6a4dc8063c72e599e6edb7f67c1599a3249a79f7d241ba66505c0b2d30
|
3 |
+
size 29532160
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3c6b6c34908965f6f3bfd2dd467a8f1bdf85844c91eedb9b48a6da7633253dd
|
3 |
+
size 29537280
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3252ccac677dcb2c4d40633057ceb3421804571bb24b33f09725fb9d6d4b4550
|
3 |
+
size 29537280
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f33c8156feb1937f9fb78ef0cee819c3d4a731eca05c903434a87de402eb336a
|
3 |
+
size 29532160
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:322b49ea61c669bcaa87fb8a7cdfd4e7a5a3de65fdb5be997cde1aad06a30022
|
3 |
+
size 29537280
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b0e1eb46c5f0ac5cddcf0e1727e13bfe6e97caa0f6d6985065311e8045b313
|
3 |
+
size 29537280
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f457b9218f0c6b09bf27954d630b819a7f7d1c9a09ac5facddc68f2f35b95da
|
3 |
+
size 29532160
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5f6619f0b16f4aa9a6ef156a3e0a24522e43ab2266484cfc33f9102f2f96f4b
|
3 |
+
size 62914560
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c61e64640718929a18b3ee6f5e7cf26145032fdca1b7c3cf39f67d4147229eff
|
3 |
+
size 29537280
|