# Page header captured from the file viewer (not part of the configuration):
# sarashina2.2-5.48B-instruct-no-tuning / config_sara_depth1.yml
# kurogane's picture
# Upload 12 files
# 118293d verified
# raw
# history blame contribute delete
# 607 Bytes
# Layer-stacking merge recipe (keys follow the mergekit configuration schema
# -- NOTE(review): confirm the consuming tool).
#
# Every slice draws from the same source model. Each slice covers a window of
# 8 layer indices and the window start advances by 4, so each slice overlaps
# the previous one by 4 indices; the windows run from 0 up to 32.
# NOTE(review): presumably `layer_range` is half-open ([start, end)), which
# would make the stacked result 7 x 8 = 56 layers -- confirm against the
# tool's documentation.
slices:
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [0, 8]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [4, 12]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [8, 16]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [12, 20]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [16, 24]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [20, 28]
  - sources:
      - model: 'sarashina2.2-3b-instruct-v0.1'
        layer_range: [24, 32]

# `passthrough` is the merge method selected for all slices above.
merge_method: passthrough

# Data type requested for the merged output.
dtype: bfloat16