File size: 973 Bytes
c13b81e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# Name of this merge recipe.
name: Q2.5-ColdBrew-R1-Obsidian
# Shared scale constant, 1/sqrt(2) (about 0.7071), used for stability.
# Anchored as `scale_factor` so the q_proj / k_proj scale entries can alias it.
# NOTE(review): `const_tag` looks like a holder key for the anchor rather than
# a merge setting -- confirm the consuming tool ignores unknown top-level keys.
const_tag: &scale_factor 0.7071067812

# Reusable per-source settings, anchored as `attenuated_env` and pulled into a
# slice source with a merge key (`<<: *attenuated_env`).
# The scale rules apply the shared scale_factor to the q_proj and k_proj
# filters; the last entry has no filter and sets 1.0 (presumably the default
# for every other tensor -- confirm against the merge tool's filter rules).
attenuate-env: &attenuated_env
  parameters:
    scale:
      - {filter: q_proj, value: *scale_factor}
      - {filter: k_proj, value: *scale_factor}
      - {value: 1.0}

# Layer stack for the passthrough merge; slices are concatenated in the order
# listed. layer_range is half-open, [start, end): the end index is excluded,
# so adjacent slices must share a boundary value to avoid dropping a layer.
slices:
  # Layers 0-8: retaining foundational knowledge and language structure.
  # The end is 9 (exclusive) so this slice meets the next one at layer 9
  # without skipping layer 8.
  - sources:
      - model: Theros/Qwen2.5-ColdBrew-R1
        layer_range: [0, 9]

  # Layers 9-18: full-strength mid-range layers.
  - sources:
      - model: Theros/Qwen2.5-ColdBrew-R1
        layer_range: [9, 19]

  # Layers 10-17 repeated: targeted reinforcement, slightly attenuated to
  # avoid over-dominance. The merge key pulls in the `parameters.scale` rules
  # defined under the `attenuated_env` anchor.
  - sources:
      - model: Theros/Qwen2.5-ColdBrew-R1
        layer_range: [10, 18]
        <<: *attenuated_env

  # Layers 19-27: keeping higher-level abstract processing untouched for
  # stability. NOTE(review): assumes the source model has 28 layers -- confirm.
  - sources:
      - model: Theros/Qwen2.5-ColdBrew-R1
        layer_range: [19, 28]

# Merge method applied to the slices above; every slice lists a single source.
merge_method: passthrough
# Data type for the merge.
dtype: bfloat16
# NOTE(review): mergekit documents `normalize` and `int8_mask` as method
# parameters (normally nested under `parameters:`), and passthrough's
# documented parameter is `scale`. At top level these two keys are probably
# no-ops for this recipe -- confirm before relying on them.
normalize: true
int8_mask: true