Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +44 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,44 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "mixtral",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32000,
|
11 |
+
"position_embedding_base": 1000000.0,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"head_dim": 128,
|
14 |
+
"sliding_window_size": 4096,
|
15 |
+
"prefill_chunk_size": 4096,
|
16 |
+
"attention_sink_size": 4,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"num_local_experts": 8,
|
19 |
+
"num_experts_per_tok": 2
|
20 |
+
},
|
21 |
+
"vocab_size": 32000,
|
22 |
+
"context_window_size": -1,
|
23 |
+
"sliding_window_size": 4096,
|
24 |
+
"prefill_chunk_size": 4096,
|
25 |
+
"attention_sink_size": 4,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"max_batch_size": 80,
|
28 |
+
"mean_gen_len": 128,
|
29 |
+
"max_gen_len": 512,
|
30 |
+
"shift_fill_factor": 0.3,
|
31 |
+
"temperature": 0.7,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 0.95,
|
34 |
+
"conv_template": "LM",
|
35 |
+
"pad_token_id": 0,
|
36 |
+
"bos_token_id": 1,
|
37 |
+
"eos_token_id": 2,
|
38 |
+
"tokenizer_files": [
|
39 |
+
"tokenizer.model",
|
40 |
+
"tokenizer.json",
|
41 |
+
"tokenizer_config.json"
|
42 |
+
],
|
43 |
+
"version": "0.1.0"
|
44 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:694ad475a195826f9a48066ca52faaa807cd70b462f71e0858cd1103511d1faf
|
3 |
+
size 52736000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54ccd49ddeadd995fc7c55b3acba2dc9ed88f58a7afdf4ad59401d7100336021
|
3 |
+
size 378011648
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75b0b589536ebaad9764655cbae7ac797d4c9daff685c7705e8aa5634297ffe9
|
3 |
+
size 378011648
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:949a8bc70d6ee8e6dcc783cdea720d25ab8862e8f87b88c0eb6c7ecfd8194970
|
3 |
+
size 378011648
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e505ed4de57e0c1e8308d66fbf7947c5fef55ba30c6cc6444596df7a46cd824
|
3 |
+
size 47251456
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a47b11a842d35b9a06f80b43250a643aa5a7ca989cbcd150f5529db3158e83b
|
3 |
+
size 188219392
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2453e46f135aa935fe56367ba22380c2ad0422a375bc065860555ac082cc58dd
|
3 |
+
size 23527424
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6624583bc9673032b7ed6982a345ffda25232a59a672619661af077d462cdb
|
3 |
+
size 30423536
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ec0f6286057025e89402cf506273fc7589fbc5843bfbd829d2219f50b930bf
|
3 |
+
size 378011648
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f37aabfa101b9b77d9e681ea95055b39f0dd69803af6eb9111fa5ed4afacc4
|
3 |
+
size 47251456
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fde7bb7400407aa7470c30dc4886d99cb65e1a940f37e982721c8fc19845ab6
|
3 |
+
size 188219392
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efff81b8a90c8cd45056d92a256e4d5cdbb1b53bddda48957ce7199879437018
|
3 |
+
size 31136240
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23b8bfbec071da9fd21e09b46fcfc138586450da1bd1ea708bf841777e936a64
|
3 |
+
size 378011648
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c3d5024556171fd268533b5b4c6e3ac13a12e26f1f5355076aa8703a3ad19c7
|
3 |
+
size 47251456
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:965c526dd520b3b1d2e20ea7594f0f532c0cb5c9c86dbe64ce1afc7acdcefb32
|
3 |
+
size 47251456
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dbfa6d03ecaed24e82e593865f813100bd78446e19b411d4dd2b5faad724b82
|
3 |
+
size 188219392
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f5d779d06edfa96e16decd127d915a1bbc618c88632322d38bdc46fdd4d2f3a
|
3 |
+
size 23527424
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bdbeff022067a2e69fd1746e3f91482301fcbc048d2a6fd723db6209c10a58f
|
3 |
+
size 30423536
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12b58eecaa5640b95d889e073a3e7d39884b0fca9d00bf07a524265d87937b27
|
3 |
+
size 378011648
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec4ffe22b70ebca596d95846d8cc765a86e94698aa6ead352c2cc82010d67dc2
|
3 |
+
size 47251456
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13fdae1568d9c8562f005127857d1324004fa4ea6b115e2aad49470270cfe782
|
3 |
+
size 188219392
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b2ac39d39d909af094bcaaf173344d964293a8e7bfafa1c72d86e700e970b31
|
3 |
+
size 31136240
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65c81186c3a15cb96af286c2f8aafcf796f7879adf929186a5655cf3513e563e
|
3 |
+
size 378011648
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ef2c56ab313450facdb469751c0999f9377e4731e03824f08e2458fe4f2cdf3
|
3 |
+
size 47251456
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86d84dc09fad42004376b6be2b020e76e206e4eedbe5b33429255c4ca4f12843
|
3 |
+
size 188219392
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c5ea12929a9663e3055f6e9c6a4e8e182a86e53cfde7070717f165892150c55
|
3 |
+
size 188219392
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e59e5cf98105fe38fba4680cd0d00a8bdbdd603af0cadd23a3b04460274fa2e8
|
3 |
+
size 23527424
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18b8ae8be922eb7627e6469f5a1a76fbed48b3f3cb591a5aa9865c6055d07d12
|
3 |
+
size 30407152
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dcfa2908a20d32bca25c19530bc1e44c03790d2b2e7e1c80f4ec11b8baf9c6e
|
3 |
+
size 378011648
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e06a2565fba013e2e587ee806dbbb54d34044528d334c4932277cba74068641
|
3 |
+
size 47251456
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:711fc15fe05596cff71f214b10ab68a0f0a37524db30477be3d08845da71d834
|
3 |
+
size 188219392
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5afc73995fd9d7df4fa9fc6dff556489bf3408a4a57d83d6cc712a030ab53394
|
3 |
+
size 31169008
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30903dd2e5fed005f58a3d06955d657e00b2990a3b225137c3c1eef4aee41912
|
3 |
+
size 30390768
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf992a611d8099017d9f863ed2ea0be7248c98c0b836227136f281026561d590
|
3 |
+
size 378011648
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10e93b7453c7cf318a131309768283b71fb8429ee638ab73e46ba7bf7f5407fb
|
3 |
+
size 47251456
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c528c9ade6bbdd665b80f60e160460dfc3abca72e1a688ba00a24d16341c14fd
|
3 |
+
size 23527424
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81e5699d96ac713afd3c3da4f03b38896f803de9f3ed05cdc9f3dc6b710b296f
|
3 |
+
size 188219392
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb84d625f10584fc0b314635efca8a28a8b8e649320ff539234365a0cf15a21c
|
3 |
+
size 31169008
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c9909419d075247f0bcf75168a475e7af8c5921cebca38d8fb444ec795bd0f3
|
3 |
+
size 30390768
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af7e9fdb327ad604f1d46c49584fe6585a208502da959b93cf7b63e21d78c8a9
|
3 |
+
size 378011648
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:224b99142632fc609d446100e21ad7dd589633ae98657673e4a8ea04165532be
|
3 |
+
size 47251456
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5112a53c06c00c3f6e3b4d071da340dfa8a33c79d018a6f292b5c038828b78d
|
3 |
+
size 188219392
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8193d2b58ddee9827f92c4e0c492697d12c1734940886cdb18dda1e97db694f4
|
3 |
+
size 378011648
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed4fa24f6cc4a8ceb5dd751e8692ea984cab990209bd4dc83dde12cde79c6add
|
3 |
+
size 47251456
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05bb6e528a1e01e766fe6faef3d4a71c9d8f68033cfff361c0632609ecf5b0a6
|
3 |
+
size 188219392
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:320f8c6e5684dc241f9f86ed64e0bda0a32326535ec592be5cf7ac95304e4de3
|
3 |
+
size 23527424
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d85ca006f18c6965350d155f31c6dfc08579a9807b0ad2107eca16609a402c93
|
3 |
+
size 25616368
|