Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +3 -0
- logs.txt +0 -0
- mlc-chat-config.json +42 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<step>": 32015
|
3 |
+
}
|
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 8192,
|
6 |
+
"intermediate_size": 28672,
|
7 |
+
"num_attention_heads": 64,
|
8 |
+
"num_hidden_layers": 80,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32016,
|
11 |
+
"position_embedding_base": 10000,
|
12 |
+
"context_window_size": 16384,
|
13 |
+
"prefill_chunk_size": 4096,
|
14 |
+
"num_key_value_heads": 8,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 32016,
|
20 |
+
"context_window_size": 16384,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 4096,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.95,
|
31 |
+
"conv_template": "codellama_instruct",
|
32 |
+
"pad_token_id": 0,
|
33 |
+
"bos_token_id": 1,
|
34 |
+
"eos_token_id": 2,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.model",
|
37 |
+
"tokenizer.json",
|
38 |
+
"added_tokens.json",
|
39 |
+
"tokenizer_config.json"
|
40 |
+
],
|
41 |
+
"version": "0.1.0"
|
42 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ed05051bd806eda7b9d79448d054b61a3150c7a960fe0eaaaa66fcad0bc55c
|
3 |
+
size 131137536
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b87f6858612633ba767c5be5b2348874813a620b51a43f139d82963813996b19
|
3 |
+
size 117440512
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f279a645f0abb1a0147453ece55af207517e33e9f6737f4b8bd947d810635a1b
|
3 |
+
size 33554432
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a192b384ed489ab231ac278a1f1ec469c5d16ef43a4eab8824f155b1c9998b3
|
3 |
+
size 18923520
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c31a4b1d6f54bd2b3ca85da3d478c18aafe180cc57b86864e3e3199d4ce65cd
|
3 |
+
size 234881024
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b53cbb2606f3720a160fc403db10469b0666337db659daec6330407113584a5e
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32cf7b21e8b4065e34d6f868cc1e69d010e430716a54034895c48bd83396ca5f
|
3 |
+
size 41943040
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dc8203b3377d0c7b50229aee682252c672db19fe17c330d1242297fbc21b197
|
3 |
+
size 33554432
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afbb9969aa45dfe225bb31173893769420052edc6ea7ca60a1aff005d953d559
|
3 |
+
size 117440512
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f430b72e4621868ce30dde2afba010785b5546791cc5c4131656476578a67a92
|
3 |
+
size 24150016
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8165a8f8ca456d5fe70a4cd54849d8130cb036e2c7939651493b215aee3b8dcb
|
3 |
+
size 234881024
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b414c67be45fa6747a4bbb0d3e7492ea6439c7dbf16b94358e663256ac795f2f
|
3 |
+
size 29360128
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbd15247aa191bc54595bba5db1a5517126410c814bb35c4ea6fa5357a54bed5
|
3 |
+
size 41943040
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2add42fd7d61018e8b6ac221899dab4fd3033625a4590d708526a11bd93ef1d7
|
3 |
+
size 131137536
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f34f0a77b8a113209b3d867dca26920249054b047f2f6a5fdd7b06b5d77b8d07
|
3 |
+
size 33554432
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5955a0acd2bc92636e6a1cb8fd9f1ae59992ab731c837c31d194c96cbda53c7
|
3 |
+
size 41943040
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad491d3f52365ca4e33a151059974bf5ca119e689b1fd4a0583c72542da8bcf4
|
3 |
+
size 117440512
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c81813ddb43f624fcc21d2da58b211621b8c82bfca983e555439252222a520f
|
3 |
+
size 29392896
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d69a058b28b1f823aae75072e29396698c8d9fabfec412315b7dbb538b63000
|
3 |
+
size 117440512
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:011dc5d22a53c6d02c9f263fd261d4383786909f48400cdf60860e925039a841
|
3 |
+
size 234881024
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9281667f9100b177d39c8fbd05847879527f9cfd2010e040ccfb0430e601b936
|
3 |
+
size 29360128
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2043ea1b2ad82765a2e1672ae56bd22511eec729ca36419c8d3056548cbb379c
|
3 |
+
size 41943040
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6937818a8e14cf465591106c67e9f7827df51a20d0693133747ae2eaab17098a
|
3 |
+
size 29409280
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:904ea1fbd1ac6ba0af2f6639a581e4adfa4fcc21c2ad709133472f4b61e3e248
|
3 |
+
size 33554432
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78851ef93b2957f8e49ab35b8cef8c5214fe52bcc37d53f81558b802c0e392b5
|
3 |
+
size 28360704
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2e9c51e77d7f7bb6c493e61e570a51104ce99cbf7db4b7202b735acb6fe8b9d
|
3 |
+
size 117440512
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34d82695d17f2755be793e237fd358955fdfa0ae9b75f29b1013618d660f4b3d
|
3 |
+
size 234881024
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bd87ee12a5755e5d8baa15359cda21d55b67a9abdbd9d49d3400eab8342fffa
|
3 |
+
size 29360128
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db571f38df068b4dac36979f2b0e2c16143004c96f953fbb7efa5d6449d9cf65
|
3 |
+
size 41943040
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb151c61db7eac587aa36ebba30a1d0dc0f317639bf011b011d4b9bad883f0f4
|
3 |
+
size 33554432
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cac6828d7ff74eaafbd99d26dae5cc200a29bb4ae437be4ebb9375833cef5d1
|
3 |
+
size 29392896
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90c5d234fe46340cb88ab0a1fdbecca890be448b74872f54a99724624bc8d9f4
|
3 |
+
size 41943040
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3136c62f1137fef1962888a9537085ac95dac4c96f93b2c01ccfb342e4ac58b3
|
3 |
+
size 33554432
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70da928478d886ec48d632531526704fe95a8322ec9d134eadb439a61f7c05ce
|
3 |
+
size 117440512
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00331ee81be33a36c24762bb3025dc310947c359fe3f67835c0c61945c0d5ca5
|
3 |
+
size 234881024
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4b8d2497cde7ed05cf37bdb704a479c2c03281b753bf66bac7e475f6bdd042c
|
3 |
+
size 117440512
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aef254e7e2fba457bacd104b136a85aa1561ca865ac818797764faba5332e0cd
|
3 |
+
size 29360128
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f6b2353fa0203e1992170465b6667506cea1b63af1f3c4b88bf579d063fc24f
|
3 |
+
size 33554432
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a42f867b659f061f21e0f409e1c3d84dcfcabd2a7738ffe55e59ef5d530162df
|
3 |
+
size 117440512
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7732e947dbab93f193cc15bf4d5971066feb7a2cec7858357dc5b5bf43d7878
|
3 |
+
size 32555008
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8f9071f47172de5676818338351a294aaee9b8e187d6c7b3d5f5b744dbf60cb
|
3 |
+
size 234881024
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe66af95c605aff9e30be282195fb4f037f040c240209f3d05caf8fecee73f69
|
3 |
+
size 29360128
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d74d7580f766f95fb5670658571adab7e4653771a841fad8a45ff7f24a238d81
|
3 |
+
size 41943040
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27e7062d434309195247418a4b7cfef81a6040d284a7b82b715bc5d0b02c0619
|
3 |
+
size 33554432
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eec337c20a1fa511f602150f5f939cea62c19753becddc0c1201867277cf9bc
|
3 |
+
size 117440512
|