JackBinary committed on
Commit
9f18c7c
·
verified ·
1 Parent(s): d5f6804

Add files using upload-large-folder tool

Browse files
README.md ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: mlc-llm
3
+ base_model: knifeayumu/Cydonia-v1.3-Magnum-v4-22B
4
+ tags:
5
+ - mlc-llm
6
+ - web-llm
7
+ ---
8
+
9
+ # Cydonia-v1.3-Magnum-v4-22B-q0f16-MLC
10
+
11
+ This is the [Cydonia-v1.3-Magnum-v4-22B](https://huggingface.co/knifeayumu/Cydonia-v1.3-Magnum-v4-22B) model in MLC format `q0f16`.
12
+ The model can be used with [MLC-LLM](https://github.com/mlc-ai/mlc-llm) and [WebLLM](https://github.com/mlc-ai/web-llm).
13
+
14
+ ## Example Usage
15
+
16
+ Before using the examples, please follow the [installation guide](https://llm.mlc.ai/docs/install/mlc_llm.html#install-mlc-packages).
17
+
18
+ ### Chat CLI
19
+
20
+ ```bash
21
+ mlc_llm chat HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q0f16-MLC
22
+ ```
23
+
24
+ ### REST Server
25
+
26
+ ```bash
27
+ mlc_llm serve HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q0f16-MLC
28
+ ```
29
+
30
+ ### Python API
31
+
32
+ ```python
33
+ from mlc_llm import MLCEngine
34
+
35
+ model = "HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q0f16-MLC"
36
+ engine = MLCEngine(model)
37
+
38
+ for response in engine.chat.completions.create(
39
+     messages=[{"role": "user", "content": "What is the meaning of life?"}],
40
+     model=model,
41
+     stream=True,
42
+ ):
43
+     for choice in response.choices:
44
+         print(choice.delta.content, end="", flush=True)
45
+ print("\n")
46
+
47
+ engine.terminate()
48
+ ```
49
+
50
+ ## Documentation
51
+
52
+ For more on MLC LLM, visit the [documentation](https://llm.mlc.ai/docs/) and [GitHub repo](https://github.com/mlc-ai/mlc-llm).
mlc-chat-config.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "mistral",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "hidden_size": 6144,
7
+ "intermediate_size": 16384,
8
+ "num_attention_heads": 48,
9
+ "num_hidden_layers": 56,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 32768,
12
+ "position_embedding_base": 1000000.0,
13
+ "num_key_value_heads": 8,
14
+ "head_dim": 128,
15
+ "context_window_size": 32768,
16
+ "sliding_window_size": -1,
17
+ "prefill_chunk_size": 8192,
18
+ "attention_sink_size": 4,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 128
21
+ },
22
+ "vocab_size": 32768,
23
+ "context_window_size": 32768,
24
+ "sliding_window_size": -1,
25
+ "prefill_chunk_size": 8192,
26
+ "attention_sink_size": 4,
27
+ "tensor_parallel_shards": 1,
28
+ "pipeline_parallel_stages": 1,
29
+ "temperature": 1.0,
30
+ "presence_penalty": 0.0,
31
+ "frequency_penalty": 0.0,
32
+ "repetition_penalty": 1.0,
33
+ "top_p": 1.0,
34
+ "tokenizer_files": [
35
+ "tokenizer.model",
36
+ "tokenizer.json",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_fallback",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "mistral_default",
46
+ "system_template": "[INST] {system_message}",
47
+ "system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
48
+ "system_prefix_token_ids": [
49
+ 1
50
+ ],
51
+ "add_role_after_system_message": false,
52
+ "roles": {
53
+ "user": "[INST]",
54
+ "assistant": "[/INST]",
55
+ "tool": "[INST]"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ " "
65
+ ],
66
+ "role_content_sep": " ",
67
+ "role_empty_sep": "",
68
+ "stop_str": [
69
+ "</s>"
70
+ ],
71
+ "stop_token_ids": [
72
+ 2
73
+ ],
74
+ "function_string": "",
75
+ "use_function_calling": false
76
+ },
77
+ "pad_token_id": 0,
78
+ "bos_token_id": 1,
79
+ "eos_token_id": 2
80
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d4476aa8c4475787006a54a18b75d4608c18a4b36e6a6b784c020574a1dc6f4
3
+ size 402653184
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:894b094b923350e37296eb158582421e7ce4c6399192df335c526d2059c8ef2d
3
+ size 75497472
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34fdf50cf739175ab3dc60f0be0a221623bff76141981e6fcc0122764af6a96a
3
+ size 402653184
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36079e0aa1eb1067495df6884dbd2a9458e21dae03aeb782278287e8f7b85d5f
3
+ size 201326592
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d279fd774ac9e2ef06400d4d15c395586aa5dedec6671a80ce69c83d0ca75eed
3
+ size 75497472
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f358b3e4757381a76111b04cc0f22ce09afd225f8ffd0455ed932830b93c1804
3
+ size 402653184
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8caef8d2f4cdfba0ac1c600fb39d050010ff033166bc265cfebe597d5c42c73a
3
+ size 100663296
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06c161f0638c17f2597b5289b50f1d4310f591353cfd9f5401fa49f26cc4eec2
3
+ size 75497472
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee494387c8dbcca4470d915c170024b5081201a00193c70ebe342a956dcd8290
3
+ size 201326592
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c942b2645ed19cb501a010d39fe5c5dd05405dcf7f3e8fc52e79e0d8b5ef3240
3
+ size 100663296
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b09cd737b831ea5d437acc2f4319f0f1ca22a2023deca34e63183f7b9c486b
3
+ size 201326592
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcd80935b13bd0e1cd3c0d252d5bd6c1ac31b830aa1b0dfa6f0cee6a437b1251
3
+ size 100663296
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfd3a6cde85f179b70f1d4b53c3b9c08f8dcefb6c1cec1e84c5c1cfe43ed49c6
3
+ size 201326592
params_shard_142.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4f805fd5b011ca7b5c57be4dd654ff7840eb06ed9d32a306701e935ad6801b6
3
+ size 201326592
params_shard_153.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b957111ff7a98de73db365d8c867e5d6e7918991ed5f7e46d34ca54a75e06649
3
+ size 75497472
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f0b0153ec9cdcd9d7a62e8f6b8e061b7318ba21a34c128e95e12d733e0e383
3
+ size 100663296
params_shard_166.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1bb5cb14d199bcb96bee592f22681f56490aa127d48409f980771f763f411a
3
+ size 201326592
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:795d4b438867b5f218cc846c112caa26e8130c4827f8eddc39d540823b8a36d2
3
+ size 75497472
params_shard_175.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a784e7f24d55bae7c41b45fc2bb92fc4a08284fd3ab3b842e3c3ebb8e6fd666e
3
+ size 402653184
params_shard_190.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1030e1facfdc1d8752890f8cc8e6bf2bb1dd036503a357911e97dbf4de2f17
3
+ size 201326592
params_shard_202.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67dd3c8166c15dd3de7ca54885ed665dcc94178918a4d73e553dee13b37198b1
3
+ size 201326592
params_shard_212.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b97abb95fa048be2382b0a655bbade395e2b003b64415d879afdf1c186921bd
3
+ size 100663296
params_shard_214.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e573c8efafadab140759d1c9808acbd4ed9c5cbd83f365e315160fdbd5f1ac64
3
+ size 201326592
params_shard_218.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec709dc82c464bd1d11d3ec5c36ed2b34ac14181a2e5c8cead6c19439fc65065
3
+ size 201326592
params_shard_219.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a6e132609a6c5685d28079db9efd801f02e34a69b853c469c4774e395c53193
3
+ size 402653184
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec246edde36f218a4b10f6dff7fcf07f347bc1eb1496d1bbefe61994db1dc4e2
3
+ size 201326592
params_shard_220.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccb0b01fa6f2e91b7d6ee0edc29ad9135f8056ab089863dc549eca1aa6f19b6f
3
+ size 100663296
params_shard_221.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72fe3dfc740badd7523b6f3376ed6fc52ea1c903e874046b389d32226dae877e
3
+ size 75497472
params_shard_225.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cca4316483101c35a0c18076367e8131647d2f19db534d1b68f708aaae869473
3
+ size 75497472
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:893b1f8d5f4812cf9fe568cd46617324edca900d3ad005c2bb406f80b830170f
3
+ size 75497472
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bb73d48ae6817847a2264317186b4bde1f1d5baee61a4978a270fff7afdc31c
3
+ size 201326592
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81ab1c73b4a8cdb26e024e78fa3f87a1e28be34140fa62bd4dfc177e7facd4e1
3
+ size 75497472
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68f71db7d1c83dec991040eb05e562d8134db89ea32896b21144545e5f03817b
3
+ size 402653184
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d80fd1b847a65aac035fa832ead9cfc65b639954dc014327238d1df5cb0a5294
3
+ size 100663296
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b3aa1fb7edaf6bc5b57e0a19dc41be0c0c73aff99de44abb15109a667cc7a3
3
+ size 201326592
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da2e43ca30e1d388766924574a99fdf903eb1e4d4961bfd6583def3d5cf1641e
3
+ size 75497472
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f812fd040f9905aef91b1194607a2e02f5c22bea326c8f4d246863a90d22ed
3
+ size 100663296
params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863610c71b9429ccbc9841781af19fdc60c27cc1c35f144c20aa732206633fb5
3
+ size 201326592
params_shard_63.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe380cba5156ff69fd68275fb46f5384b097f4db58ae05e0f5861b660dd05e0
3
+ size 402653184
params_shard_67.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1774374649e1f2bb12f4b5639678def197de9332f460e76905aae5a8ca1ff4b3
3
+ size 402653184
params_shard_70.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05a4e5664a948bd0a6e419d96032dc6c95fbf82860ce95859503323df4f051ac
3
+ size 201326592
params_shard_77.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bda6bb6ea815b8d197babcc2a2fac5e6e065d4f6cdc41a7250c4b24bbdb848b
3
+ size 75497472
params_shard_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f07e67901c8d6ea0314536e26ab8ffe6b65627dbb8d6ed86b1a496abc65cfca4
3
+ size 100663296
params_shard_80.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26c2c453eb3940a1ff281ae12e2ab1137030f3d63735f8d6c04cb01c9369c69
3
+ size 100663296
params_shard_82.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:585a5ecaf86b33ca5c4382daf7c7b77cf6d21119febf1df7e3fd5f73117b5dcc
3
+ size 201326592
params_shard_99.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61d53278651a4b421711ed51e717d0be30d5f2886556c59d7d784922e760f14a
3
+ size 402653184
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff