Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +40 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 5120,
|
6 |
+
"intermediate_size": 13824,
|
7 |
+
"num_attention_heads": 40,
|
8 |
+
"num_hidden_layers": 40,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 51200,
|
11 |
+
"position_embedding_base": 10000,
|
12 |
+
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 8192,
|
14 |
+
"num_key_value_heads": 40,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1
|
17 |
+
},
|
18 |
+
"vocab_size": 51200,
|
19 |
+
"context_window_size": 8192,
|
20 |
+
"sliding_window_size": -1,
|
21 |
+
"prefill_chunk_size": 8192,
|
22 |
+
"attention_sink_size": -1,
|
23 |
+
"tensor_parallel_shards": 1,
|
24 |
+
"mean_gen_len": 128,
|
25 |
+
"max_gen_len": 512,
|
26 |
+
"shift_fill_factor": 0.3,
|
27 |
+
"temperature": 0.7,
|
28 |
+
"repetition_penalty": 1.0,
|
29 |
+
"top_p": 0.95,
|
30 |
+
"conv_template": "llama-2",
|
31 |
+
"pad_token_id": 0,
|
32 |
+
"bos_token_id": 1,
|
33 |
+
"eos_token_id": 2,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.model",
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"version": "0.1.0"
|
40 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:492553ddbcb6f467828f1ed4a08d18b344cc4099ab34586bd2081122bacbd4e2
|
3 |
+
size 131072000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44231b33c22413fbc336903f220e5538a672c232ef6622058950fe1a524b8e3a
|
3 |
+
size 35389440
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ac871dd1110ffa24c8fc197f194f0da75f1baa1ad14fa232d353b2afbf5a53f
|
3 |
+
size 39321600
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2af6b1137f59bcdcd6a3c96497ee4f46deade18c398d5e319bdba897ddfb1157
|
3 |
+
size 32952320
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:deb9ab4298f6a063ce980e839934388c67f592058a6816b829cf64b624c28d51
|
3 |
+
size 35389440
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f8641fbdcf38e3779c1d1f7bb8e09e8443b9d8b11ea6467ed99dcb83a0b1a44
|
3 |
+
size 70778880
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2730f11c3166e9d980bda9f021a1eddc8c06bfcb0991244d4923dd5bdd62cf7d
|
3 |
+
size 39321600
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:353e69b477be296a9547d4a3d93e589c57f1d5bc4c76ee60d187dbb864a2f8d6
|
3 |
+
size 32972800
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a05879ca86ad311bde9d62785577a0fe67cad2f94c718fb6752513c1f75a6fbe
|
3 |
+
size 35389440
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa7e368e59973016af461f82334a8f8d22524a444dec82168354183e764e1253
|
3 |
+
size 70778880
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a595f0da8bdbd2eb6a0e13117c6b07980b8c8507bef6c98fceaff6055c0232da
|
3 |
+
size 39321600
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7868a43f555f328492247621dd50771f5354102d6b2e56acc829c5ea16ad020e
|
3 |
+
size 32952320
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78878a0d214923a7b74b60a5fbe883acfcb27e7678d7e61d4b760fa58f9d4d5d
|
3 |
+
size 35389440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71c1ea59f1d2fcc70fba3d3147698ddf4a12666f9e399ed196d0440bc0af1f5
|
3 |
+
size 35389440
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5afd5a1e7dcac72092adeeea901b992acf538e72fa72ab0f7034a1f0a6dfa06
|
3 |
+
size 70778880
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51450c6a9303518664bb53be6a900e73cc2bb1271e352a3cb6733273c0902963
|
3 |
+
size 39321600
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26736bb4ac241ba3db7185f717713a087f215f64583d121992964ac14e6d4d0d
|
3 |
+
size 32952320
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89b5a877eadb05e6a755513ec037df1a6f0f2e6b9363f43b02add1145dbd9390
|
3 |
+
size 35389440
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6b24092e774a2523cdc3248f8c9002daef33d7c1af1bcbaf530893cf8caebf
|
3 |
+
size 70778880
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62aa37e5f29e90e113b8988388f52e0ecee6cb6a8b320273821277230c56c2ed
|
3 |
+
size 39321600
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8861e09ad7cdefeeab6f157ee9c2d87c88a28af4e0463e1a8fea5d50e84ac549
|
3 |
+
size 32952320
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04d4086402f05ad587a5a0b9cc4e0743c99f6a414907d1b4bdd4625888d64857
|
3 |
+
size 35389440
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c1d86c92df7a11c1713362f09bc5c097e10fba7a3bcb2836bb200f629406d20
|
3 |
+
size 70778880
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca38b312487bb82d0bdb7ce830e73d11e4af5de707bc7ed008fe5e50be4b69da
|
3 |
+
size 39321600
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8e7a058f78c1b1f82efe62001f9b8d749aa822f8f0d1d62f9754f9e4375b6e2
|
3 |
+
size 32952320
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:699c5ca4bbac83427b869ce12dc9f9d66ef715e8b31ac26959639f91a0ecb431
|
3 |
+
size 32952320
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb8759cdf092dffb0005f36dcad0601a8d1a593e65b3301fc4e379e0495fe120
|
3 |
+
size 35389440
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21ad9cf99be485656556a99005daaf1fac0aab62724727926a289ad51a897704
|
3 |
+
size 70778880
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ea3f11e3acf97ce3308ce596f71c70b8f5f447b767b07e433c969a0e8643e91
|
3 |
+
size 39321600
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21244bf7a8d6ae247f46e7f012700307275ef900aa4ddd7eda1acb7efab5dd2b
|
3 |
+
size 32952320
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb24cf17530fc445ddc49342488d30f15a45c50211d3b376566dd8a9d72ecc5d
|
3 |
+
size 35389440
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e248f1e8043a8861ff3cf76b63745a288e8bf828c4a8c5191660699ff2833809
|
3 |
+
size 70778880
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27da96fde86f83e62dbed49c45129472534c312e53096acdf7c5e439330e91d9
|
3 |
+
size 39321600
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddb59287eda2f3928130cdbbfd769b3a96bb2fa1d65b53dffb4868f7c8693029
|
3 |
+
size 32952320
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea5457e43bbb4245b053b9c62c36551f0396f26828ec4e7c9ba399c3337568b9
|
3 |
+
size 35389440
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7329d25ca4cf1a8eb765c0271155dc7a35d62198a592890f08ab3590d139c48
|
3 |
+
size 70778880
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2a2182cd62a28b30a67d600eeeb54b4aa14b982f2d3600bec1d4f4b0ce3eec0
|
3 |
+
size 70778880
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb77a0eb9d75b443c920b501938048c78308d2e2b22fbf2d3cf5214641db97c6
|
3 |
+
size 39321600
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:114b28c0f703f49276999d9f51dcaded3d203807709fce2509a7da6d89721dbd
|
3 |
+
size 32952320
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67d5f5546188b41816bed58443b7a107981be036875156109fa1fca490150530
|
3 |
+
size 35389440
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65f32bcd62a5e2b6d6cbb1e63e28c8d0856910a79a1a2e087a5eb010ff8462f2
|
3 |
+
size 70778880
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf3e0fa89a2adf5a511700ebeacf1d850d4c8334951445017c477f0b68c26e05
|
3 |
+
size 39321600
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8af8d4f4f6c909ac873ca1763eac16ec211f0c0ee84b728cb59a66f9d1b72e1
|
3 |
+
size 32952320
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69bf58f38b7d3dfac7874b310b20c8df52e5db0bc0bd06352742b96189cd4d0a
|
3 |
+
size 35389440
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:235f1065e80940ffece98b00c1ae4fc2d645956d5d2904df23f23ff51a8f66c9
|
3 |
+
size 70778880
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82119494c1b5750195f9b6684de564ac21ff15c38456c7c998d5214199240a53
|
3 |
+
size 39321600
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd1731afcc9ee9ae76f03c59b62c0ab85fe52b10616b60b88d38e0de9dfc279c
|
3 |
+
size 39321600
|