---
# Multi-stage merge recipe made of three YAML documents. Each document
# carries a `name`; the third document refers to the first two by those names.
# NOTE(review): resolving a `name` as a model reference in a later document is
# presumably handled by the consuming merge tool -- confirm against its docs.

# Stage 1: dare_ties merge of karakuri-lm-70b-chat-v0.1 onto the
# nitky/Swallow-70b-RP base, using one scalar weight per tensor filter.
models:
  - model: nitky/Swallow-70b-RP
    # no parameters necessary for base model
  - model: karakuri-ai/karakuri-lm-70b-chat-v0.1
    parameters:
      density: 1
      weight:
        - filter: mlp
          value: 0.1
        - filter: self_attn
          value: 0.4
        - value: 0  # fallback for rest of tensors.
merge_method: dare_ties
base_model: nitky/Swallow-70b-RP
dtype: bfloat16
tokenizer_source: union
name: Swallow-70b-RP-EX-base
---
# Stage 2: same two models and merge method as stage 1, but the mlp and
# self_attn weights are 9-element lists instead of scalars.
# NOTE(review): a list value is presumably spread across the layer stack as a
# gradient by the merge tool -- confirm before changing the list lengths.
models:
  - model: nitky/Swallow-70b-RP
    # no parameters necessary for base model
  - model: karakuri-ai/karakuri-lm-70b-chat-v0.1
    parameters:
      density: 1
      weight:
        - filter: mlp
          value: [0.4, 0.1, 0.4, 0.1, 0.4, 0.1, 0.4, 0.1, 0.1]
        - filter: self_attn
          value: [0.4, 0.4, 0.1, 0.4, 0.1, 0.4, 0.1, 0.4, 0.4]
        - value: 0  # fallback for rest of tensors.
merge_method: dare_ties
base_model: nitky/Swallow-70b-RP
dtype: bfloat16
tokenizer_source: union
name: Swallow-70b-RP-EX-flavor
---
# Stage 3: slerp between the stage 1 and stage 2 results over layers 0-80,
# with the stage 1 result as base_model. The self_attn and mlp `t` lists are
# element-wise complements of each other (each pair sums to 1).
slices:
  - sources:
      - model: Swallow-70b-RP-EX-base
        layer_range: [0, 80]
      - model: Swallow-70b-RP-EX-flavor
        layer_range: [0, 80]
merge_method: slerp
base_model: Swallow-70b-RP-EX-base
parameters:
  t:  # model stabilization
    - filter: self_attn
      value: [0, 0.5, 0.3, 0.7, 1]
    - filter: mlp
      value: [1, 0.5, 0.7, 0.3, 0]
    - value: 0.5  # fallback for rest of tensors
dtype: bfloat16
name: Swallow-70b-RP-EX