# File size: 1,327 Bytes
# c39c219
# mergekit configuration: DELLA merge of three donor models onto the
# base model named in `base_model`.
#
# Per-model `weight` entries are conditional on tensor name: an entry with
# `filter:` applies to tensors matching that name, and the final entry
# without a filter is the fallback for everything else. A list value is a
# gradient spread across the layer stack (see the mergekit docs for the
# exact interpolation rules); a scalar applies uniformly.
#
# `density` and `epsilon` are per-model DELLA pruning settings. Per the
# mergekit docs, density +/- epsilon must stay inside (0, 1); all three
# models below satisfy that.
models:
  - model: Retreatcost/KansenSakura-Radiance-RP-12b
    parameters:
      weight:
        - filter: self_attn
          value: [0.2, 0.25, 0.35, 0.55, 0.7, 0.8, 0.65, 0.4]
        # NOTE(review): 4-point gradient here, while every other list in
        # this file has 8 points -- confirm this is intentional.
        - filter: mlp
          value: [0.25, 0.35, 0.25, 0.44]
        - filter: norm
          value: 0.35
        # Fallback weight. This model has no lm_head entry, so lm_head
        # tensors also use this value.
        - value: 0.40
      density: 0.45
      epsilon: 0.25

  - model: Retreatcost/Ollpheist-12B
    parameters:
      weight:
        - filter: self_attn
          value: [0.0, 0.1, 0.25, 0.45, 0.55, 0.45, 0.25, 0.1]
        - filter: mlp
          value: [0.0, 0.15, 0.3, 0.5, 0.7, 0.55, 0.35, 0.15]
        - filter: norm
          value: 0.25
        - filter: lm_head
          value: 0.4
        # Fallback weight for tensors not matched above.
        - value: 0.25
      density: 0.4
      epsilon: 0.35

  - model: Vortex5/Shadow-Crystal-12B
    parameters:
      weight:
        - filter: self_attn
          value: [0.2, 0.2, 0.15, 0.35, 0.55, 0.55, 0.25, 0.6]
        - filter: mlp
          value: [0.0, 0.1, 0.25, 0.5, 0.4, 0.4, 0.65, 0.65]
        - filter: lm_head
          value: 0.55
        - filter: norm
          value: 0.15
        # Fallback weight for tensors not matched above.
        - value: 0.15
      density: 0.35
      epsilon: 0.25

merge_method: della
base_model: Vortex5/MegaMoon-Karcher-12B

# Global merge parameters (apply to the merge as a whole, not per model).
parameters:
  lambda: 1.0
  normalize: true

dtype: bfloat16

# The output tokenizer is taken from this model.
tokenizer:
  source: Retreatcost/KansenSakura-Radiance-RP-12b