# Gemma-The-Writer-DEADLINE-10B / mergekit_config.yml
# Uploaded by DavidAU ("Upload folder using huggingface_hub"),
# commit 3c081fe (verified), 1.62 kB.
# Six splits plus "end game".
# "D" starts at plus .1 vs. the down_proj / o_proj scale.
# 40 plus.
# Layer-stacking plan: each entry under `slices` contributes one run of layers
# from the source model, listed here in stacking order.
slices:
  # Base stack: layer_range [0, 41] of the source model, with no scaling
  # parameters applied.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [0, 41]

  # "End game": layer_range [41, 42] is repeated five times below.
  # In each copy the `filter` entries set the scale for tensors whose name
  # matches o_proj / down_proj; the trailing bare `value` is the scale for
  # everything the filters did not match (per mergekit's parameter rules).

  # Copy 1: o_proj and down_proj scaled to .3333.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [41, 42]
        parameters:
          scale:
            - filter: o_proj
              value: 0.3333333333333
            - filter: down_proj
              value: 0.3333333333333
            - value: 0.3333333333333

  # Copy 2: scaled to .4444.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [41, 42]
        parameters:
          scale:
            - filter: o_proj
              value: 0.4444444444444
            - filter: down_proj
              value: 0.4444444444444
            - value: 0.4444444444444

  # Copy 3: scaled to .5555.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [41, 42]
        parameters:
          scale:
            - filter: o_proj
              value: 0.5555555555555
            - filter: down_proj
              value: 0.5555555555555
            - value: 0.5555555555555

  # Copy 4: scaled to .6666.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [41, 42]
        parameters:
          scale:
            - filter: o_proj
              value: 0.6666666666666
            - filter: down_proj
              value: 0.6666666666666
            - value: 0.6666666666666

  # Copy 5: o_proj and down_proj scaled to .7777.
  # NOTE(review): unlike the copies above, the default scale here (.8888) is
  # higher than the o_proj / down_proj scale (.7777) - confirm this is
  # intentional and not a copy/paste slip.
  - sources:
      - model: J:/Gemma-The-Writer-9B
        layer_range: [41, 42]
        parameters:
          scale:
            - filter: o_proj
              value: 0.777777777777
            - filter: down_proj
              value: 0.777777777777
            - value: 0.888888888888

# passthrough: layers are stacked as listed; the only modification is the
# per-tensor `scale` configured above.
merge_method: passthrough
# Data type used for the merge.
dtype: bfloat16