# Neo_7b-merge2 / mergekit_config.yml
# Uploaded by DewEfresh with huggingface_hub (commit a71c1d1, verified, 1.44 kB).
# Output layers: the 28 source layers (0-27) are handled in 7 groups of 4.
# Within each group, the first three layers are each blended with the group's
# fourth layer, so the merged model keeps 3 layers per group (21 in total).
#
# mergekit treats layer_range as half-open, [start, end): a single layer i is
# written [i, i + 1]. A range such as [i, i] selects no layers at all.
#
# NOTE(review): both sources of every slice reference the same checkpoint.
# Confirm that the slerp implementation in the mergekit version in use accepts
# two slices of one model before relying on this config.
slices:
  # Group 1: layers 0-2, each blended with layer 3
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [0, 1]
      - model: m-a-p/neo_7b
        layer_range: [3, 4]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [1, 2]
      - model: m-a-p/neo_7b
        layer_range: [3, 4]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [2, 3]
      - model: m-a-p/neo_7b
        layer_range: [3, 4]

  # Group 2: layers 4-6, each blended with layer 7
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [4, 5]
      - model: m-a-p/neo_7b
        layer_range: [7, 8]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [5, 6]
      - model: m-a-p/neo_7b
        layer_range: [7, 8]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [6, 7]
      - model: m-a-p/neo_7b
        layer_range: [7, 8]

  # Group 3: layers 8-10, each blended with layer 11
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [8, 9]
      - model: m-a-p/neo_7b
        layer_range: [11, 12]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [9, 10]
      - model: m-a-p/neo_7b
        layer_range: [11, 12]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [10, 11]
      - model: m-a-p/neo_7b
        layer_range: [11, 12]

  # Group 4: layers 12-14, each blended with layer 15
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [12, 13]
      - model: m-a-p/neo_7b
        layer_range: [15, 16]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [13, 14]
      - model: m-a-p/neo_7b
        layer_range: [15, 16]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [14, 15]
      - model: m-a-p/neo_7b
        layer_range: [15, 16]

  # Group 5: layers 16-18, each blended with layer 19
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [16, 17]
      - model: m-a-p/neo_7b
        layer_range: [19, 20]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [17, 18]
      - model: m-a-p/neo_7b
        layer_range: [19, 20]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [18, 19]
      - model: m-a-p/neo_7b
        layer_range: [19, 20]

  # Group 6: layers 20-22, each blended with layer 23
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [20, 21]
      - model: m-a-p/neo_7b
        layer_range: [23, 24]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [21, 22]
      - model: m-a-p/neo_7b
        layer_range: [23, 24]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [22, 23]
      - model: m-a-p/neo_7b
        layer_range: [23, 24]

  # Group 7 (last group): layers 24-26, each blended with layer 27
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [24, 25]
      - model: m-a-p/neo_7b
        layer_range: [27, 28]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [25, 26]
      - model: m-a-p/neo_7b
        layer_range: [27, 28]
  - sources:
      - model: m-a-p/neo_7b
        layer_range: [26, 27]
      - model: m-a-p/neo_7b
        layer_range: [27, 28]
# Merge settings applied to every slice.
merge_method: slerp
base_model: m-a-p/neo_7b
parameters:
  # Interpolation factor; must be nested under `parameters` to be read as a
  # merge parameter. Intent: apply 1/3 of the 4th layer of each group to each
  # of the previous 3 layers.
  # NOTE(review): this assumes t = 0 keeps the first source of a slice
  # unchanged and t = 1 yields the second - confirm against the slerp
  # documentation.
  t: 0.3333
dtype: bfloat16
# NOTE(review): `output_path` is not among the documented mergekit config
# keys; the output directory is normally passed on the `mergekit-yaml` command
# line. Confirm this key is honored, or pass the path as a CLI argument.
output_path: ./merged_redistributed_neo_7b