Upload 2 files
Browse files
Updated to use the correct files, which set `norm` to `2.0` so that the observer properly emulates MSE selection.
- config.json +2 -1
- recipe.yaml +1 -1
config.json
CHANGED
|
@@ -48,7 +48,8 @@
|
|
| 48 |
"observer": "memoryless_mse",
|
| 49 |
"observer_kwargs": {
|
| 50 |
"grid": -2.0,
|
| 51 |
-
"maxshrink": -1.0
|
|
|
|
| 52 |
},
|
| 53 |
"scale_dtype": "torch.float8_e4m3fn",
|
| 54 |
"strategy": "tensor_group",
|
|
|
|
| 48 |
"observer": "memoryless_mse",
|
| 49 |
"observer_kwargs": {
|
| 50 |
"grid": -2.0,
|
| 51 |
+
"maxshrink": -1.0,
|
| 52 |
+
"norm": 2.0
|
| 53 |
},
|
| 54 |
"scale_dtype": "torch.float8_e4m3fn",
|
| 55 |
"strategy": "tensor_group",
|
recipe.yaml
CHANGED
|
@@ -16,7 +16,7 @@ default_stage:
|
|
| 16 |
scale_dtype: torch.float8_e4m3fn
|
| 17 |
zp_dtype: null
|
| 18 |
observer: memoryless_mse
|
| 19 |
-
observer_kwargs: {maxshrink: -1.0, grid: -2.0}
|
| 20 |
input_activations:
|
| 21 |
num_bits: 4
|
| 22 |
type: float
|
|
|
|
| 16 |
scale_dtype: torch.float8_e4m3fn
|
| 17 |
zp_dtype: null
|
| 18 |
observer: memoryless_mse
|
| 19 |
+
observer_kwargs: {maxshrink: -1.0, grid: -2.0, norm: 2.0}
|
| 20 |
input_activations:
|
| 21 |
num_bits: 4
|
| 22 |
type: float
|