DataSnake committed on
Commit
ed6b1a9
·
verified ·
1 Parent(s): c924e31

Upload 2 files

Browse files

Updated to use the correct files, which set `norm` to `2.0` in the observer kwargs so that the observer properly emulates MSE selection.

Files changed (2) hide show
  1. config.json +2 -1
  2. recipe.yaml +1 -1
config.json CHANGED
@@ -48,7 +48,8 @@
48
  "observer": "memoryless_mse",
49
  "observer_kwargs": {
50
  "grid": -2.0,
51
- "maxshrink": -1.0
 
52
  },
53
  "scale_dtype": "torch.float8_e4m3fn",
54
  "strategy": "tensor_group",
 
48
  "observer": "memoryless_mse",
49
  "observer_kwargs": {
50
  "grid": -2.0,
51
+ "maxshrink": -1.0,
52
+ "norm": 2.0
53
  },
54
  "scale_dtype": "torch.float8_e4m3fn",
55
  "strategy": "tensor_group",
recipe.yaml CHANGED
@@ -16,7 +16,7 @@ default_stage:
16
  scale_dtype: torch.float8_e4m3fn
17
  zp_dtype: null
18
  observer: memoryless_mse
19
- observer_kwargs: {maxshrink: -1.0, grid: -2.0}
20
  input_activations:
21
  num_bits: 4
22
  type: float
 
16
  scale_dtype: torch.float8_e4m3fn
17
  zp_dtype: null
18
  observer: memoryless_mse
19
+ observer_kwargs: {maxshrink: -1.0, grid: -2.0, norm: 2.0}
20
  input_activations:
21
  num_bits: 4
22
  type: float