Bagel-DareDevil-8B-Llama3 / mergekit_config.yml
slices:
  - sources:
      - model: mlabonne/Daredevil-7B
        layer_range: [0, 32] # Adjust based on the actual number of layers
      - model: mrcuddle/Bagel-Hermes-Lumimaid-Llama3-8B
        layer_range: [0, 32] # Adjust based on the actual number of layers
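# Both source models use 32 transformer layers, so the [0, 32] ranges above
# cover each model's full layer stack.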
merge_method: slerp
base_model: mrcuddle/Bagel-Hermes-Lumimaid-Llama3-8B
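# SLERP interpolation schedule: t = 0 keeps the base model's weights, t = 1
# takes the other model's. The filtered value lists below are interpolated
# across layers for tensors matching self_attn and mlp; the final bare value
# (0.5) is the default t for all remaining tensors.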
parameters:
  t:
    - filter: self_attn
      value: [0, 0.5, 0.3, 0.7, 1]
    - filter: mlp
      value: [1, 0.5, 0.7, 0.3, 0]
    - value: 0.5
dtype: bfloat16
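# A typical way to run this merge, assuming the mergekit CLI is installed
# (e.g. `pip install mergekit`); the output directory name is illustrative:
#   mergekit-yaml mergekit_config.yml ./Bagel-DareDevil-8B-Llama3 --cuda
# The --cuda flag runs the merge on GPU if one is available.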