# Kyllene-57B-v1.0 / mergekit-config.yml
# Uploaded by TeeZee ("Upload mergekit-config.yml", commit adc3440).
# mergekit configuration: SLERP merge of two locally stored models.
#
# Both sources contribute layers 0-100, and the first source is also used as
# the base model of the merge.

# Layer slices taken from each source model; the two ranges must line up.
slices:
  - sources:
      - model: "../2xbagel-dpo-34b-v0.2"
        layer_range: [0, 100]
      - model: "../2xNous-Capybara-34B"
        layer_range: [0, 100]

merge_method: slerp
base_model: "../2xbagel-dpo-34b-v0.2"

# Interpolation factor `t`, selected per tensor by name filter.
# NOTE(review): per the mergekit docs, t = 0 yields the base model and t = 1
# the other model, and a multi-element list is treated as a gradient that is
# interpolated across the layer range - confirm against the mergekit version
# in use.
parameters:
  t:
    - filter: lm_head
      value: [0.55]
    - filter: embed_tokens
      value: [0.7]
    - filter: self_attn
      value: [0.65, 0.35]
    - filter: mlp
      value: [0.35, 0.65]
    - filter: layernorm
      value: [0.4, 0.6]
    - filter: modelnorm
      value: [0.6]
    - value: 0.5  # fallback for rest of tensors

# Data type named for the merge.
dtype: float16