Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +34 -0
- config.json +27 -0
- mergekit_config.yml +17 -0
- merges.txt +0 -0
- model-00001-of-00015.safetensors +3 -0
- model-00001-of-00042.safetensors +3 -0
- model-00002-of-00015.safetensors +3 -0
- model-00002-of-00042.safetensors +3 -0
- model-00003-of-00015.safetensors +3 -0
- model-00003-of-00042.safetensors +3 -0
- model-00004-of-00015.safetensors +3 -0
- model-00004-of-00042.safetensors +3 -0
- model-00005-of-00015.safetensors +3 -0
- model-00005-of-00042.safetensors +3 -0
- model-00006-of-00015.safetensors +3 -0
- model-00006-of-00042.safetensors +3 -0
- model-00007-of-00015.safetensors +3 -0
- model-00007-of-00042.safetensors +3 -0
- model-00008-of-00015.safetensors +3 -0
- model-00008-of-00042.safetensors +3 -0
- model-00009-of-00015.safetensors +3 -0
- model-00009-of-00042.safetensors +3 -0
- model-00010-of-00015.safetensors +3 -0
- model-00010-of-00042.safetensors +3 -0
- model-00011-of-00015.safetensors +3 -0
- model-00011-of-00042.safetensors +3 -0
- model-00012-of-00015.safetensors +3 -0
- model-00012-of-00042.safetensors +3 -0
- model-00013-of-00015.safetensors +3 -0
- model-00013-of-00042.safetensors +3 -0
- model-00014-of-00015.safetensors +3 -0
- model-00014-of-00042.safetensors +3 -0
- model-00015-of-00015.safetensors +3 -0
- model-00015-of-00042.safetensors +3 -0
- model-00016-of-00042.safetensors +3 -0
- model-00017-of-00042.safetensors +3 -0
- model-00018-of-00042.safetensors +3 -0
- model-00019-of-00042.safetensors +3 -0
- model-00020-of-00042.safetensors +3 -0
- model-00021-of-00042.safetensors +3 -0
- model-00022-of-00042.safetensors +3 -0
- model-00023-of-00042.safetensors +3 -0
- model-00024-of-00042.safetensors +3 -0
- model-00025-of-00042.safetensors +3 -0
- model-00026-of-00042.safetensors +3 -0
- model-00027-of-00042.safetensors +3 -0
- model-00028-of-00042.safetensors +3 -0
- model-00029-of-00042.safetensors +3 -0
- model-00030-of-00042.safetensors +3 -0
- model-00031-of-00042.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp
|
6 |
+
- HuggingFaceH4/zephyr-7b-beta
|
7 |
+
---
|
8 |
+
|
9 |
+
# mistralai-7B-slerp-v0.1
|
10 |
+
|
11 |
+
mistralai-7B-slerp-v0.1 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
12 |
+
* [Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp](https://huggingface.co/Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp)
|
13 |
+
* [HuggingFaceH4/zephyr-7b-beta](https://huggingface.co/HuggingFaceH4/zephyr-7b-beta)
|
14 |
+
|
15 |
+
## 🧩 Configuration
|
16 |
+
|
17 |
+
```yaml
|
18 |
+
slices:
|
19 |
+
  - sources:
|
20 |
+
      - model: Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp
|
21 |
+
        layer_range: [0, 32]
|
22 |
+
      - model: HuggingFaceH4/zephyr-7b-beta
|
23 |
+
        layer_range: [0, 32]
|
24 |
+
merge_method: slerp
|
25 |
+
base_model: Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp
|
26 |
+
parameters:
|
27 |
+
  t:
|
28 |
+
    - filter: self_attn
|
29 |
+
      value: [0, 0.5, 0.3, 0.7, 1]
|
30 |
+
    - filter: mlp
|
31 |
+
      value: [1, 0.5, 0.7, 0.3, 0]
|
32 |
+
    - value: 0.5 # fallback for rest of tensors
|
33 |
+
dtype: bfloat16
|
34 |
+
```
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 14336,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "mistral",
|
16 |
+
"num_attention_heads": 32,
|
17 |
+
"num_hidden_layers": 32,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-05,
|
20 |
+
"rope_theta": 10000.0,
|
21 |
+
"sliding_window": 4096,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "bfloat16",
|
24 |
+
"transformers_version": "4.47.1",
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 32000
|
27 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
slices:
|
3 |
+
  - sources:
|
4 |
+
      - model: Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp
|
5 |
+
        layer_range: [0, 32]
|
6 |
+
      - model: HuggingFaceH4/zephyr-7b-beta
|
7 |
+
        layer_range: [0, 32]
|
8 |
+
merge_method: slerp
|
9 |
+
base_model: Weyaxi/OpenHermes-2.5-neural-chat-v3-3-Slerp
|
10 |
+
parameters:
|
11 |
+
  t:
|
12 |
+
    - filter: self_attn
|
13 |
+
      value: [0, 0.5, 0.3, 0.7, 1]
|
14 |
+
    - filter: mlp
|
15 |
+
      value: [1, 0.5, 0.7, 0.3, 0]
|
16 |
+
    - value: 0.5 # fallback for rest of tensors
|
17 |
+
dtype: bfloat16
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c13195751872572280585048cfa57be875b1f2ba08c167c0ec35402247ec63e0
|
3 |
+
size 960521552
|
model-00001-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5839c81af91221e4d409b7fac2c3e7d348774887a39841e184ac73bc68e7c1f3
|
3 |
+
size 1027604608
|
model-00002-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c7fbd5c5031292a956f75e8f71567855948e5f55f925182dfe3979bf44cfdbf
|
3 |
+
size 989890720
|
model-00002-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acbd6b33e25c348a61135b2a83c242f2635fbf8212f1dd0b042d9bdf20226264
|
3 |
+
size 1027604624
|
model-00003-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:536c76a1fb46469d6de07e1058c7a81865de675f8eb93f8025c91abe821ec0c9
|
3 |
+
size 989890728
|
model-00003-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f56bb12d823b51abf8c03b3a39ee02195ec880bc6b2353c5b28213648eb5ded6
|
3 |
+
size 865106856
|
model-00004-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:995ca55c26e3c97175478c3f1ee95cc30a3b56f83580f15327c24b1e72547c7e
|
3 |
+
size 998287760
|
model-00004-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c02dddf7f39794ace456cf31afbacded441328e0d354939a444e881d41e1dc0
|
3 |
+
size 681595608
|
model-00005-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ef358a5900c19d9af76039b33f658a2a9c8529b8b34cb050685b298199eb885
|
3 |
+
size 947956216
|
model-00005-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02ab8006e4fc3fa959bb0693f67f440944f853056a287ce3def96a5693b02425
|
3 |
+
size 681595608
|
model-00006-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:202db32c0d6d1a3e6aa44cb95930c31606eb3fcd060f9c57151a30c43ae1bb31
|
3 |
+
size 989890728
|
model-00006-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e368d95bb3e84233da2416d096b453883486c51408c97ac6dab226c6fb9074c
|
3 |
+
size 681595608
|
model-00007-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d633bcef7bc4d29a761309c655e16fd280cfe7309985da2176d5daf9a19f7ec6
|
3 |
+
size 989890720
|
model-00007-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faecb678494457303f884f74a1353ab6dc18d6ff579f4a9d9f3e75b4fc8b8da8
|
3 |
+
size 681595608
|
model-00008-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31ddf20807ff1510426f81cd57ea6f62a44c56623c0e247745ec18a9b460a3fd
|
3 |
+
size 998287760
|
model-00008-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a534413ad96845bedc575133175d94c30d67580c1f12f5bbe5613d1ac414717b
|
3 |
+
size 681595608
|
model-00009-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a464dfe9dfe3cfa914cd1c737654c29681b9b3cac9d2d44350b9c0706ecb61d4
|
3 |
+
size 947956216
|
model-00009-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aeb919229d913950a4f48a2b2045b40447f77bc286848f37ca600141709a0a3
|
3 |
+
size 681595608
|
model-00010-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f6051c4dedcca801715686bf56e398fd96a85ff19289167244ebd4b92861aaf
|
3 |
+
size 989890728
|
model-00010-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b8aff17f78d53406231c36ea637554c85293aa2e410b58ba57f679b86de3728
|
3 |
+
size 681595608
|
model-00011-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fba2ffb170438ab90745984e7d9576834beec812146384a365ee566aae05d6af
|
3 |
+
size 989890728
|
model-00011-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbfc9bd06923f4ab5ebad6b86e6ace221a0dee1223c8737dab10da4b5c4876d6
|
3 |
+
size 681595608
|
model-00012-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e869ba69d194df4d9930d50deec6902d68e570ad66ca735f1ca507ea46362bfe
|
3 |
+
size 998287752
|
model-00012-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e2c79a11256f601c389276b79f174830c8a628d3ab7fc41e6e2125e5775d13e
|
3 |
+
size 681595608
|
model-00013-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fb7ec2eb4527f3c064ed69ba4540d6be88f8461bc2b5265e3036856ee0f64d9
|
3 |
+
size 947956200
|
model-00013-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:233352e838ba59a0ce09cbc65b803fe48ea5c0ce31d286a3b606abcc94a3073f
|
3 |
+
size 681595608
|
model-00014-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8c5eaa732cbc08d08186426c05e47bd1e52d8b8c008bffffc2eac814628fe22
|
3 |
+
size 989890712
|
model-00014-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:773fc0c6f72014ef74942446caf447f79e1c0e5b96c69fa27f34f5d60eb744e5
|
3 |
+
size 681595608
|
model-00015-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:028b913db5597362e67188449fcdceef9a7feb02b1a7cd69bdb14a9e5522bd33
|
3 |
+
size 755009440
|
model-00015-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0ed1732a4cabc211a1bd811d211d7a475647c365db3eddee76a13a754641895
|
3 |
+
size 681595608
|
model-00016-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83ecc2763438b229952bad3d56522abf42e0452d741f4252ecbe4e3d98356024
|
3 |
+
size 681595608
|
model-00017-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24f5469dcb217f9b6c9c229ed7554a44bdc5fa3c1072bd28859aedef6b2005fd
|
3 |
+
size 681595608
|
model-00018-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:583bbf3be9ad8fac2e4667b532b4a6fe2d077392e04a67d72b2c1c98f3621920
|
3 |
+
size 681595608
|
model-00019-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc5b7a5a2b16e870ed09d379d342d32c3e14e55c1ca26e20e1a83d8d2f6a9152
|
3 |
+
size 681595608
|
model-00020-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac4f65add044ee4edbd5ad029fe8c8050648bc61f62ee372336641e6336c651a
|
3 |
+
size 681595608
|
model-00021-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16bb9f0fbd7ea8268ec19e2fbaedcaad86cbacab770bced16f97753d29b22c78
|
3 |
+
size 681595608
|
model-00022-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e04caf2b9915d54752836eaf340c7921b7e8ad1a0d340ce37d3b22852b5aa1e8
|
3 |
+
size 681595608
|
model-00023-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d406b63579336d88a151c4badf9d5fdbaf516e154db952995869b3d4418baf7
|
3 |
+
size 681595608
|
model-00024-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16d050c6a225540034122cdff2c2ac4cfb642af6e8d80e1cdff9b536468d95e3
|
3 |
+
size 681595608
|
model-00025-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff66385953de62a59a9e516df7ba9e6428e5c177ec391e1244632455b7344bf0
|
3 |
+
size 681595608
|
model-00026-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbf7a1385dcfdccaa8354c3af4b07e29db3dceaf279b2dd15213fa6543d365c3
|
3 |
+
size 681595608
|
model-00027-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8094f5c5e2088956a2e2f1fdf042120bc2863832ea4a671ded5d021c846a4d55
|
3 |
+
size 681595608
|
model-00028-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9496171ac6cd9516e0b495baec4ce00bda39f288150fd26123098f0ce8791d9
|
3 |
+
size 681595608
|
model-00029-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e65d1843130fd3126d0a7b862b9ce789924b8e780b2326a45256fc940a9491c
|
3 |
+
size 681595608
|
model-00030-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d899a4efc2fc6bf3d44e812beac08096261f8ab6e2fcfc16152a4acf04f57904
|
3 |
+
size 681595608
|
model-00031-of-00042.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f330792cdfa7f55daebb772936f5fd6b345197a28cc7949fcf61e1dfe683ddf9
|
3 |
+
size 681595608
|