File size: 1,327 Bytes
c39c219
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51

# Input models for the merge. Each entry names a model repository and gives
# its own `density`, `epsilon`, and `weight` settings. A `weight` list holds
# entries with an optional `filter` and a `value`; the last entry of each list
# has no filter.
# NOTE(review): this looks like a mergekit config, where the first matching
# filter wins and list values are interpolated across layers - confirm against
# the consuming tool before reordering any `weight` entries.
models:
  - model: 'Retreatcost/KansenSakura-Radiance-RP-12b'
    parameters:
      density: 0.45
      epsilon: 0.25
      weight:
        # Eight-point list for self_attn: rises to 0.8, then falls to 0.4.
        - filter: self_attn
          value: [0.2, 0.25, 0.35, 0.55, 0.7, 0.8, 0.65, 0.4]
        # Only four points here, unlike the eight-point mlp lists used by the
        # other two entries.
        - filter: mlp
          value: [0.25, 0.35, 0.25, 0.44]
        - filter: norm
          value: 0.35
        # Unfiltered fallback entry; this model has no explicit lm_head entry.
        - value: 0.40
  # Second input model. Its self_attn and mlp lists both start at 0.0 and
  # peak in the middle (0.55 and 0.7 respectively).
  # NOTE(review): the order of the `weight` entries may be significant to the
  # consuming tool (presumably first matching filter wins) - keep it as is.
  - model: 'Retreatcost/Ollpheist-12B'
    parameters:
      density: 0.4
      epsilon: 0.35
      weight:
        - filter: self_attn
          value: [0.0, 0.1, 0.25, 0.45, 0.55, 0.45, 0.25, 0.1]
        - filter: mlp
          value: [0.0, 0.15, 0.3, 0.5, 0.7, 0.55, 0.35, 0.15]
        - filter: norm
          value: 0.25
        # Explicit scalar for lm_head, higher than the 0.25 fallback below.
        - filter: lm_head
          value: 0.4
        # Unfiltered fallback entry.
        - value: 0.25
  # Third input model. It has the lowest density (0.35) and the lowest
  # unfiltered fallback weight (0.15) of the three entries.
  # NOTE(review): the order of the `weight` entries may be significant to the
  # consuming tool (presumably first matching filter wins) - keep it as is.
  - model: 'Vortex5/Shadow-Crystal-12B'
    parameters:
      density: 0.35
      epsilon: 0.25
      weight:
        - filter: self_attn
          value: [0.2, 0.2, 0.15, 0.35, 0.55, 0.55, 0.25, 0.6]
        - filter: mlp
          value: [0.0, 0.1, 0.25, 0.5, 0.4, 0.4, 0.65, 0.65]
        # lm_head is listed before norm here, the reverse of the Ollpheist
        # entry; the two filter strings do not overlap.
        - filter: lm_head
          value: 0.55
        - filter: norm
          value: 0.15
        # Unfiltered fallback entry.
        - value: 0.15
# Settings for the merge as a whole rather than for a single input model.
base_model: 'Vortex5/MegaMoon-Karcher-12B'
merge_method: della
dtype: bfloat16

# Top-level parameters, separate from the per-model `parameters` mappings.
parameters:
  lambda: 1.0
  normalize: true

tokenizer:
  # Same repository as the first entry under `models`.
  source: 'Retreatcost/KansenSakura-Radiance-RP-12b'