Add files using upload-large-folder tool
Browse files- LICENSE +21 -0
- assets/chat_template.jinja +90 -0
- config.json +66 -0
- generation_config.json +9 -0
- model-00091-of-000163.safetensors +3 -0
- model-00121-of-000163.safetensors +3 -0
- model-00123-of-000163.safetensors +3 -0
- model-00124-of-000163.safetensors +3 -0
- model-00125-of-000163.safetensors +3 -0
- model-00126-of-000163.safetensors +3 -0
- model-00127-of-000163.safetensors +3 -0
- model-00128-of-000163.safetensors +3 -0
- model-00129-of-000163.safetensors +3 -0
- model-00130-of-000163.safetensors +3 -0
- model-00131-of-000163.safetensors +3 -0
- model-00132-of-000163.safetensors +3 -0
- model-00133-of-000163.safetensors +3 -0
- model-00134-of-000163.safetensors +3 -0
- model-00135-of-000163.safetensors +3 -0
- model-00136-of-000163.safetensors +3 -0
- model-00137-of-000163.safetensors +3 -0
- model-00138-of-000163.safetensors +3 -0
- model-00139-of-000163.safetensors +3 -0
- model-00140-of-000163.safetensors +3 -0
- model-00141-of-000163.safetensors +3 -0
- model-00142-of-000163.safetensors +3 -0
- model-00143-of-000163.safetensors +3 -0
- model-00144-of-000163.safetensors +3 -0
- model-00145-of-000163.safetensors +3 -0
- model-00146-of-000163.safetensors +3 -0
- model-00147-of-000163.safetensors +3 -0
- model-00148-of-000163.safetensors +3 -0
- model-00149-of-000163.safetensors +3 -0
- model-00150-of-000163.safetensors +3 -0
- model-00151-of-000163.safetensors +3 -0
- model-00152-of-000163.safetensors +3 -0
- model-00153-of-000163.safetensors +3 -0
- model-00154-of-000163.safetensors +3 -0
- model-00155-of-000163.safetensors +3 -0
- model-00156-of-000163.safetensors +3 -0
- model-00157-of-000163.safetensors +3 -0
- model-00158-of-000163.safetensors +3 -0
- model-00159-of-000163.safetensors +3 -0
- model-00160-of-000163.safetensors +3 -0
- model-00161-of-000163.safetensors +3 -0
- model-00162-of-000163.safetensors +3 -0
- model-00163-of-000163.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer.json +0 -0
- tokenizer_config.json +35 -0
LICENSE
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
MIT License
|
2 |
+
|
3 |
+
Copyright (c) 2023 DeepSeek
|
4 |
+
|
5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
6 |
+
of this software and associated documentation files (the "Software"), to deal
|
7 |
+
in the Software without restriction, including without limitation the rights
|
8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9 |
+
copies of the Software, and to permit persons to whom the Software is
|
10 |
+
furnished to do so, subject to the following conditions:
|
11 |
+
|
12 |
+
The above copyright notice and this permission notice shall be included in all
|
13 |
+
copies or substantial portions of the Software.
|
14 |
+
|
15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
21 |
+
SOFTWARE.
|
assets/chat_template.jinja
ADDED
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{% if not add_generation_prompt is defined %}
|
2 |
+
{% set add_generation_prompt = false %}
|
3 |
+
{% endif %}
|
4 |
+
{% if not thinking is defined %}
|
5 |
+
{% set thinking = false %}
|
6 |
+
{% endif %}
|
7 |
+
{% set ns = namespace(is_first=false, is_tool=false, system_prompt='', is_first_sp=true, is_last_user=false, is_only_sys=false, is_prefix=false) %}
|
8 |
+
{%- for message in messages %}
|
9 |
+
{%- if message['role'] == 'system' %}
|
10 |
+
{%- if ns.is_first_sp %}
|
11 |
+
{% set ns.system_prompt = ns.system_prompt + message['content'] %}
|
12 |
+
{% set ns.is_first_sp = false %}
|
13 |
+
{%- else %}
|
14 |
+
{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}
|
15 |
+
{%- endif %}
|
16 |
+
{% set ns.is_only_sys = true %}
|
17 |
+
{%- endif %}
|
18 |
+
{%- endfor %}
|
19 |
+
{{ bos_token }}{{ ns.system_prompt }}
|
20 |
+
{%- for message in messages %}
|
21 |
+
{%- if message['role'] == 'user' %}
|
22 |
+
{%- set ns.is_tool = false -%}
|
23 |
+
{%- set ns.is_first = false -%}
|
24 |
+
{%- set ns.is_last_user = true -%}
|
25 |
+
{{'<|User|>' + message['content']}}
|
26 |
+
{%- endif %}
|
27 |
+
{%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}
|
28 |
+
{%- if ns.is_last_user or ns.is_only_sys %}
|
29 |
+
{{'<|Assistant|></think>'}}
|
30 |
+
{%- endif %}
|
31 |
+
{%- set ns.is_last_user = false -%}
|
32 |
+
{%- set ns.is_first = false %}
|
33 |
+
{%- set ns.is_tool = false -%}
|
34 |
+
{%- for tool in message['tool_calls'] %}
|
35 |
+
{%- if not ns.is_first %}
|
36 |
+
{%- if message['content'] is none %}
|
37 |
+
{{'<|tool▁calls▁begin|><|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}
|
38 |
+
{%- else %}
|
39 |
+
{{message['content'] + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}
|
40 |
+
{%- endif %}
|
41 |
+
{%- set ns.is_first = true -%}
|
42 |
+
{%- else %}
|
43 |
+
{{'<|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}
|
44 |
+
{%- endif %}
|
45 |
+
{%- endfor %}
|
46 |
+
{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}
|
47 |
+
{%- endif %}
|
48 |
+
{%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}
|
49 |
+
{%- if ns.is_last_user %}
|
50 |
+
{{'<|Assistant|>'}}
|
51 |
+
{%- if message['prefix'] is defined and message['prefix'] and thinking %}
|
52 |
+
{{'<think>'}}
|
53 |
+
{%- else %}
|
54 |
+
{{'</think>'}}
|
55 |
+
{%- endif %}
|
56 |
+
{%- endif %}
|
57 |
+
{%- if message['prefix'] is defined and message['prefix'] %}
|
58 |
+
{%- set ns.is_prefix = true -%}
|
59 |
+
{%- endif %}
|
60 |
+
{%- set ns.is_last_user = false -%}
|
61 |
+
{%- if ns.is_tool %}
|
62 |
+
{{message['content'] + '<|end▁of▁sentence|>'}}
|
63 |
+
{%- set ns.is_tool = false -%}
|
64 |
+
{%- else %}
|
65 |
+
{%- set content = message['content'] -%}
|
66 |
+
{%- if '</think>' in content %}
|
67 |
+
{%- set content = content.split('</think>', 1)[1] -%}
|
68 |
+
{%- endif %}
|
69 |
+
{{content + '<|end▁of▁sentence|>'}}
|
70 |
+
{%- endif %}
|
71 |
+
{%- endif %}
|
72 |
+
{%- if message['role'] == 'tool' %}
|
73 |
+
{%- set ns.is_last_user = false -%}
|
74 |
+
{%- set ns.is_tool = true -%}
|
75 |
+
{{'<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}
|
76 |
+
{%- endif %}
|
77 |
+
{%- if message['role'] != 'system' %}
|
78 |
+
{% set ns.is_only_sys = false %}
|
79 |
+
{%- endif %}
|
80 |
+
{%- endfor -%}
|
81 |
+
{% if add_generation_prompt and not ns.is_tool%}
|
82 |
+
{% if ns.is_last_user or ns.is_only_sys or not ns.is_prefix %}
|
83 |
+
{{'<|Assistant|>'}}
|
84 |
+
{%- if not thinking %}
|
85 |
+
{{'</think>'}}
|
86 |
+
{%- else %}
|
87 |
+
{{'<think>'}}
|
88 |
+
{%- endif %}
|
89 |
+
{% endif %}
|
90 |
+
{% endif %}
|
config.json
ADDED
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"DeepseekV32ForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 1,
|
9 |
+
"ep_size": 1,
|
10 |
+
"first_k_dense_replace": 3,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 7168,
|
13 |
+
"index_head_dim": 128,
|
14 |
+
"index_n_heads": 64,
|
15 |
+
"index_topk": 2048,
|
16 |
+
"initializer_range": 0.02,
|
17 |
+
"intermediate_size": 18432,
|
18 |
+
"kv_lora_rank": 512,
|
19 |
+
"max_position_embeddings": 163840,
|
20 |
+
"model_type": "deepseek_v32",
|
21 |
+
"moe_intermediate_size": 2048,
|
22 |
+
"moe_layer_freq": 1,
|
23 |
+
"n_group": 8,
|
24 |
+
"n_routed_experts": 256,
|
25 |
+
"n_shared_experts": 1,
|
26 |
+
"norm_topk_prob": true,
|
27 |
+
"num_attention_heads": 128,
|
28 |
+
"num_experts_per_tok": 8,
|
29 |
+
"num_hidden_layers": 61,
|
30 |
+
"num_key_value_heads": 128,
|
31 |
+
"num_nextn_predict_layers": 1,
|
32 |
+
"q_lora_rank": 1536,
|
33 |
+
"qk_nope_head_dim": 128,
|
34 |
+
"qk_rope_head_dim": 64,
|
35 |
+
"quantization_config": {
|
36 |
+
"activation_scheme": "dynamic",
|
37 |
+
"fmt": "e4m3",
|
38 |
+
"quant_method": "fp8",
|
39 |
+
"scale_fmt": "ue8m0",
|
40 |
+
"weight_block_size": [
|
41 |
+
128,
|
42 |
+
128
|
43 |
+
]
|
44 |
+
},
|
45 |
+
"rms_norm_eps": 1e-06,
|
46 |
+
"rope_scaling": {
|
47 |
+
"beta_fast": 32,
|
48 |
+
"beta_slow": 1,
|
49 |
+
"factor": 40,
|
50 |
+
"mscale": 1.0,
|
51 |
+
"mscale_all_dim": 1.0,
|
52 |
+
"original_max_position_embeddings": 4096,
|
53 |
+
"type": "yarn"
|
54 |
+
},
|
55 |
+
"rope_theta": 10000,
|
56 |
+
"routed_scaling_factor": 2.5,
|
57 |
+
"scoring_func": "sigmoid",
|
58 |
+
"tie_word_embeddings": false,
|
59 |
+
"topk_group": 4,
|
60 |
+
"topk_method": "noaux_tc",
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.44.2",
|
63 |
+
"use_cache": true,
|
64 |
+
"v_head_dim": 128,
|
65 |
+
"vocab_size": 129280
|
66 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 0,
|
4 |
+
"eos_token_id": 1,
|
5 |
+
"do_sample": true,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.95,
|
8 |
+
"transformers_version": "4.46.3"
|
9 |
+
}
|
model-00091-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1af54d034a014c6dc7fcc31fe4dc12283dabd646663e0600e1c497ace317283f
|
3 |
+
size 4302384963
|
model-00121-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8220f4bba79bc539b5e9f620ee6bd011c2d7019ca5c87a1de756aadb6fd3a8fb
|
3 |
+
size 4302384963
|
model-00123-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:933a0047a3076f3567a12653492acdf8908ae1b949a50fd799037061856bf3a7
|
3 |
+
size 4302061105
|
model-00124-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb4c1d6160b67023093f34063e83c623f5fbf45397368f0d7b0e115e1cab3616
|
3 |
+
size 4302384914
|
model-00125-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d04ab22f6b81510a934adc41ab5f54101d1bd02598c6ad16c5f11f37e56f34ff
|
3 |
+
size 4302122764
|
model-00126-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2076aa18de4129c3458a0c615fab2c36eb587f25b6169a5b672ff67a3bc1cf9
|
3 |
+
size 4302384516
|
model-00127-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d257babe622d97e62bb47381cc22d68c8e5a33144aff16e7cef1e9332a2899b
|
3 |
+
size 4302384961
|
model-00128-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bdcc3e95bc69acdcd8719e856d46c5e9da452142fbfd31422f4cb26ce9b7b5b
|
3 |
+
size 4302122576
|
model-00129-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b867068ab2b0af1195c3d5150b4876fe0ae915e0a20778c31938b0652c5ab67
|
3 |
+
size 4302384704
|
model-00130-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e7762e1c24b582e683792613e3f2f51dfa56d3d9ba4469707c8608bf5b81b8b
|
3 |
+
size 4302384963
|
model-00131-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:038a877e36efb2db30228136973c596d70465eb815733ea78b2294048e9b3e53
|
3 |
+
size 4302122398
|
model-00132-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a44bd9d0c9321f8035a75c6884a1eb15d5095560718c20c32af8ed0f5b1ed42
|
3 |
+
size 4302384890
|
model-00133-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48c805a44a792608ed607e7b059a69f0d16d54296c9c30531ce0d34d143b1b61
|
3 |
+
size 4302122786
|
model-00134-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f60fcb87cbdd1cdc1065788f2d312ca408202847c18bae4b76861cc22bec25e1
|
3 |
+
size 4302384494
|
model-00135-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2ff2a81a95620f18bf7effe05fe88aae93b9da277051fb1179f5ea95a641b7c
|
3 |
+
size 4302384963
|
model-00136-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51a301d4251ceb67e4a4131bbe13b3e0392ea7d1e046baf70fa833073e37162c
|
3 |
+
size 4302122598
|
model-00137-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28ca58280396bacaed5822b50810a6ec18f50246f6f0e16d0d4b1ca7916d5003
|
3 |
+
size 4302384680
|
model-00138-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2188167c9a92f23abc688b811631af950c657ad11b6babb19193c484fb47c89
|
3 |
+
size 4302384963
|
model-00139-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:730e1f7a60a8dd668b9f66e19e845bf460c69ed16e1ca147536db454cb920dcf
|
3 |
+
size 4302122420
|
model-00140-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c9d97f77f84cb1f2ce648957c7c4a9a2e4be40517230dae34440713193be199
|
3 |
+
size 4302384870
|
model-00141-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:addafdbda4f4f2372d9bc6602ad2c9db41e08994801e65dcf80c2713cbb8f578
|
3 |
+
size 3245204828
|
model-00142-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7811d07e729bc554ca1d4cf6e483cb0ceadf77a15803fcc5a31c84508df1aa85
|
3 |
+
size 4302061105
|
model-00143-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af72ca4b9c78b8ed572ba6a802622b54137b83c2ae78b92e1b8c6ccd40b1484a
|
3 |
+
size 4302384914
|
model-00144-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:777d3e07c8e30327ea7636ddcc06d5b37d8c19f1eb316450e77c2bfbd60ce7d4
|
3 |
+
size 4302122764
|
model-00145-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45b82ca66094d7e6d33f6491017985530b3f8b090d74384c37ae0968ae3c018a
|
3 |
+
size 4302384516
|
model-00146-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c7ec67772c98355997775b5a29bae1de1322b365f515ef54c3bf980912d5497
|
3 |
+
size 4302384961
|
model-00147-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:933770f5b4431fb49e417bb2decea8ce1165b314103fd6bc41fd44b85c26e4a2
|
3 |
+
size 4302122576
|
model-00148-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a63c0e22abbac275a25a68eb94b92f10df68bb3c04adee8e1998e77cad3abfdb
|
3 |
+
size 4302384704
|
model-00149-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:038e8f71d61504303e233b1ccf6b247ecdc1a4e49c8ba6d88425884f04464a12
|
3 |
+
size 4302384963
|
model-00150-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17aa00caaf33e569adf3f0dd6f68ee25204b60f3de933d5c3a339d0aa58ed96f
|
3 |
+
size 4302122398
|
model-00151-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3143a333d78bfd9b04d1c901495bf9808a84ef264fad8db1a4a7303bd8de36e3
|
3 |
+
size 4302384890
|
model-00152-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faab231af4888b4144a2b1e2ceefef95267720ce680a01b77b6e0939271c276a
|
3 |
+
size 4302122786
|
model-00153-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:541920f3455fd2af78183cb4dfc25c506ce3307aaef00747ec775c6a5f6b81c2
|
3 |
+
size 4302384494
|
model-00154-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb92a9b64c15767b0091689ee83e09f665575efd9828e9c23fbb4f3f0116bb38
|
3 |
+
size 4302384963
|
model-00155-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00e7db5d5886e70b2b1a00c726e0a16e479e09108b9cfcf50cd40477d110aecc
|
3 |
+
size 4302122598
|
model-00156-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f9173e6ff5ba68336cf89555a1a9012abb9603cfb2c2ceadde88e913c60ffff
|
3 |
+
size 4302384680
|
model-00157-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9753c9ccd4054c7376e118fda9ce26af382e14dfc5dae3e720fcd92163c40a0
|
3 |
+
size 4302384963
|
model-00158-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96779eff0e873144606f55d25b26e547a0e7d6dd7e43f293fd3022c41b3d0ab8
|
3 |
+
size 4302122420
|
model-00159-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ded32f0915daeec6f62f0362897adbe24cc4f182fd2654699e8031deca5b7ca8
|
3 |
+
size 4302384870
|
model-00160-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bebfda7d0b074448ff96a4db7f296c747b6bf99d1e37ae311a12bd6a1ff3517
|
3 |
+
size 5285723731
|
model-00161-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f74187acd4313d4f490232e3f4992ff17796cf1010ba878e21e64bc156beb168
|
3 |
+
size 4305819875
|
model-00162-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae44c570af0a2a0da07af3d04d9ee956013189d62b2d15b5da807604ecabe53e
|
3 |
+
size 4302384938
|
model-00163-of-000163.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eef9fb48d5bdb7e09c7ed08d06b9a8bbf44726379e02e8f43d28cda7c921537
|
3 |
+
size 6643591758
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"bos_token": {
|
5 |
+
"__type": "AddedToken",
|
6 |
+
"content": "<|begin▁of▁sentence|>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": true,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false
|
11 |
+
},
|
12 |
+
"clean_up_tokenization_spaces": false,
|
13 |
+
"eos_token": {
|
14 |
+
"__type": "AddedToken",
|
15 |
+
"content": "<|end▁of▁sentence|>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": true,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false
|
20 |
+
},
|
21 |
+
"legacy": true,
|
22 |
+
"model_max_length": 131072,
|
23 |
+
"pad_token": {
|
24 |
+
"__type": "AddedToken",
|
25 |
+
"content": "<|end▁of▁sentence|>",
|
26 |
+
"lstrip": false,
|
27 |
+
"normalized": true,
|
28 |
+
"rstrip": false,
|
29 |
+
"single_word": false
|
30 |
+
},
|
31 |
+
"sp_model_kwargs": {},
|
32 |
+
"unk_token": null,
|
33 |
+
"tokenizer_class": "LlamaTokenizerFast",
|
34 |
+
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% if not thinking is defined %}{% set thinking = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, system_prompt='', is_first_sp=true, is_last_user=false, is_only_sys=false, is_prefix=false) %}{%- for message in messages %}{%- if message['role'] == 'system' %}{%- if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{%- else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{%- endif %}{% set ns.is_only_sys = true %}{%- endif %}{%- endfor %}{{ bos_token }}{{ ns.system_prompt }}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{%- set ns.is_first = false -%}{%- set ns.is_last_user = true -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}{%- if ns.is_last_user or ns.is_only_sys %}{{'<|Assistant|></think>'}}{%- endif %}{%- set ns.is_last_user = false -%}{%- set ns.is_first = false %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls'] %}{%- if not ns.is_first %}{%- if message['content'] is none %}{{'<|tool▁calls▁begin|><|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- else %}{{message['content'] + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- set ns.is_first = true -%}{%- else %}{{'<|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- endfor %}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}{%- if ns.is_last_user %}{{'<|Assistant|>'}}{%- if message['prefix'] is defined and message['prefix'] and thinking %}{{'<think>'}}{%- else %}{{'</think>'}}{%- endif %}{%- endif %}{%- if message['prefix'] is defined and message['prefix'] %}{%- set ns.is_prefix = true -%}{%- endif %}{%- set ns.is_last_user = false -%}{%- if ns.is_tool %}{{message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{%- set content = message['content'] -%}{%- if '</think>' in content %}{%- set content = content.split('</think>', 1)[1] -%}{%- endif %}{{content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_last_user = false -%}{%- set ns.is_tool = true -%}{{'<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- if message['role'] != 'system' %}{% set ns.is_only_sys = false %}{%- endif %}{%- endfor -%}{% if add_generation_prompt and not ns.is_tool%}{% if ns.is_last_user or ns.is_only_sys or not ns.is_prefix %}{{'<|Assistant|>'}}{%- if not thinking %}{{'</think>'}}{%- else %}{{'<think>'}}{%- endif %}{% endif %}{% endif %}"
|
35 |
+
}
|