| { |
| "MSE": 0.0, |
| "MSE/layer0": 0.0, |
| "dead_code_fraction": 1.0, |
| "dead_code_fraction/layer0": 1.0, |
| "epoch": 10.43, |
| "eval_MSE/layer0": 6073.8636798095695, |
| "eval_accuracy": 0.5791389432485323, |
| "eval_dead_code_fraction/layer0": 0.1981725, |
| "eval_input_norm/layer0": 0.7182212994247673, |
| "eval_loss": 1.6604058742523193, |
| "eval_multicode_k": 1, |
| "eval_output_norm/layer0": 76.78913438796998, |
| "eval_runtime": 6.7146, |
| "eval_samples": 100, |
| "eval_samples_per_second": 14.893, |
| "eval_steps_per_second": 0.298, |
| "input_norm": 0.0, |
| "input_norm/layer0": 0.0, |
| "loss": 1.6774777018260956, |
| "max_norm": 153.29054260253906, |
| "max_norm/layer0": 153.29054260253906, |
| "mean_norm": 75.17323780059814, |
| "mean_norm/layer0": 75.17323780059814, |
| "multicode_k": 1, |
| "output_norm": 0.0, |
| "output_norm/layer0": 0.0, |
| "perplexity": 5.261445896555633, |
| "runtime": 132212.7109, |
| "samples_per_second": 72.61, |
| "steps_per_second": 0.756, |
| "train_samples": 920563 |
| } |