Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +71 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q8f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 11008,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32016,
|
11 |
+
"position_embedding_base": 1000000,
|
12 |
+
"context_window_size": 16384,
|
13 |
+
"prefill_chunk_size": 16384,
|
14 |
+
"num_key_value_heads": 32,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 32016,
|
20 |
+
"context_window_size": 16384,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 16384,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llama-2",
|
35 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n ",
|
36 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
37 |
+
"roles": {
|
38 |
+
"user": "[INST]",
|
39 |
+
"assistant": "[/INST]",
|
40 |
+
"tool": "[INST]"
|
41 |
+
},
|
42 |
+
"role_templates": {
|
43 |
+
"user": "{user_message}",
|
44 |
+
"assistant": "{assistant_message}",
|
45 |
+
"tool": "{tool_message}"
|
46 |
+
},
|
47 |
+
"messages": [],
|
48 |
+
"seps": [
|
49 |
+
" "
|
50 |
+
],
|
51 |
+
"role_content_sep": " ",
|
52 |
+
"role_empty_sep": " ",
|
53 |
+
"stop_str": [
|
54 |
+
"[INST]"
|
55 |
+
],
|
56 |
+
"stop_token_ids": [
|
57 |
+
2
|
58 |
+
],
|
59 |
+
"function_string": "",
|
60 |
+
"use_function_calling": false
|
61 |
+
},
|
62 |
+
"pad_token_id": 0,
|
63 |
+
"bos_token_id": 1,
|
64 |
+
"eos_token_id": 2,
|
65 |
+
"tokenizer_files": [
|
66 |
+
"tokenizer.model",
|
67 |
+
"tokenizer.json",
|
68 |
+
"tokenizer_config.json"
|
69 |
+
],
|
70 |
+
"version": "0.1.0"
|
71 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a20068b7c0a56abf3c1071545f038422bfc7fa7092bbab38e7efbb5055a858ed
|
3 |
+
size 131137536
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8b26b65dbfceeca6ed7c5109b41f642b0816299a095d4b5896e85b4e84ca4bd
|
3 |
+
size 131137536
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db58f17606085f9070187ae7ddae9a3b1da70ed744b6fd3bb1c8f5da5fdc4df5
|
3 |
+
size 45088768
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0da421fb4b87561f34af89e68685152d675d11ea538bade3828f641dbc4b64c
|
3 |
+
size 90177536
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c6e44b84c19e5597388e728af11dab88def7106e1978e0ccf1f970b92c15738
|
3 |
+
size 29442048
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a41e11820d0b0d17ced197bfdf6b9f73872088badd49578eb3e49c72de60fbf
|
3 |
+
size 45088768
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c54fc633945968a5da16b4a4c52a595e9985405b0673e79eb24ac2138c97f06
|
3 |
+
size 50331648
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a5b9b1a1ca1133ca5bcefb298a70a8f6bf693615018023d9fe6c719feef8e8e
|
3 |
+
size 90177536
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7248dd0d2066254d36884d846e6c3a70dbbfbdbb2445c154b5c5c362d064eb05
|
3 |
+
size 29442048
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e725d11afee1c25e3b116a5998e562ef6d8a877e26f206dda402980bd2f2457
|
3 |
+
size 45088768
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb199cf403b3073dc55418489a06d87700700921b658dff079514aab35f96839
|
3 |
+
size 50331648
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eade04125bb48c91e54ac1be741c60c011806420a41c08d19170d99d50826f7
|
3 |
+
size 90177536
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4b395cc8d66a59b09ab4f40e497e028e68e918d62d70897324b6d77e38b7387
|
3 |
+
size 29442048
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187205cab4bc8adad1474b849a0c9ed59497f4c1df97c22b08c59bb8c8a98cc1
|
3 |
+
size 50331648
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:458cadba6a2129fd52a61cd81af9e9ff26da000bb7b44bda6136d1639de38140
|
3 |
+
size 45088768
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd265010dbbab80f5af71c3f56d1e448093b3c3ead21c72b8337557e72b0f4e0
|
3 |
+
size 50331648
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc19d184e1259eaa6fcf7d252ec756cbe152612ac716f54c2f5fff589df04ad5
|
3 |
+
size 90177536
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c04b06d0feb225f896be62acb4310986ce403427117e38b5415ac9d34d91878
|
3 |
+
size 29442048
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0486066d5ea84cc0862c757cef2db4831de056ba57fc6c42dcd262a4690ee1c
|
3 |
+
size 45088768
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03799249f408019436bc55617313db182621e479a64173ac7eaf83621a5a882e
|
3 |
+
size 50331648
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cd0af2242793c2fed53d5f1622d20440527165312c52cf6d99aaa0e1d4973
|
3 |
+
size 90177536
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54b9d7e81e327b4b93d0caedbd851f147918709641ae85e666360899e809b79a
|
3 |
+
size 29442048
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57de7aa2f4a408ebace55f81ecaee25edc1af4fc3a4aafe6e5da96dac5872ddc
|
3 |
+
size 45088768
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:306d96d8572995c1602dcfb01814cd6718a43c535494e6a824e863ee8f80e5a3
|
3 |
+
size 50331648
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8301c8554128455978d3cd25c05d3880b6375cb7bbe478b1689e36799ce07b72
|
3 |
+
size 90177536
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3597ebecd92455d594acb30665ac12d68c25fe356204e3c39eca62c7f2021a1e
|
3 |
+
size 90177536
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7af395883fef365aba76c7947be331c171c4a1a56c2209f157e715729cac7435
|
3 |
+
size 29442048
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f575b95a1638d18b23217a69d9cdc8f6c3ca8739a025e2e445e0fc3fcb555a23
|
3 |
+
size 45088768
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0ca3e45bf1a437ebe4f7f210019d9fc55c96dc5d48b295d24ad399ad614b8e2
|
3 |
+
size 50331648
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df2f83e1dff71e6d252018b821079cd513e31414960de0db06fc43a4c6aad12e
|
3 |
+
size 90177536
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5aabeca778d515c96b1833d7869070be261ed00d86b41824f3df386584d5c10c
|
3 |
+
size 29442048
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c5e0733fad95328171e5e611abe59ff05a6f3054686fade5489c71db737e437
|
3 |
+
size 45088768
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1edff3e5a99fb02a4bc126bbb57c15436fe2dee8387546a30737d767812bb836
|
3 |
+
size 50331648
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7be04f5c6b35bc4bc392f9f7670ddc6609fb5ce192c1c8aa89f93eeeba7af21d
|
3 |
+
size 90177536
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4b1878e630423a10d282ae13ae948054d7dda556b37390f9363c4e6a7bfcf51
|
3 |
+
size 29442048
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a88179c18af91cff1df0c33011c31ed7052b633d5eb4076f729e1a0bd91703b
|
3 |
+
size 29442048
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52d56c0a9cd5952fde3b793ce117968d1e680e14e09d87f42313a26021283f91
|
3 |
+
size 45088768
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d40d88b6c49a9240bc1230961b5451a280a0e77ff9b6bac1a6277e1e71275503
|
3 |
+
size 8454144
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b62534e4c273d7529b982a45666e2ccd41fe7087efd7266ee87c885df00d2ec
|
3 |
+
size 45088768
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5427336198e10328ca02990956dff9e371ff28edec3de3f83c024bea39be38a6
|
3 |
+
size 50331648
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b53d29519e8acea2748cd85891db589152097644e884c67e67bde29c990fa00c
|
3 |
+
size 90177536
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2467439f36178c39b29e97cb785e6ea6ea9b2213eac828be8c57fb90d91440b1
|
3 |
+
size 29442048
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3df6f5b716a98b6cda615426b3464aaa670ced8af34ee7f8b3697b4ab8b9b69e
|
3 |
+
size 45088768
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1797488218e861f29c82cd605e5f8e59b1de4a75e0679180e847a3fc3f1df7de
|
3 |
+
size 50331648
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4830a6be1816a57e151027c5025f42f3436270c1dd20bdcf173903754cc260a4
|
3 |
+
size 50331648
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9afffda6fd81db3f70a444eddb0bf6d08213f686ad07e9bce6b5996acd92acfd
|
3 |
+
size 90177536
|