nethack-vae / training_data.json
CatkinChen's picture
Add training data
12413f5 verified
raw
history blame
2.3 kB
{
"train_losses": [
2100.769680175781,
1210.195811767578,
1176.4252709960938,
1143.586368408203,
1115.7994873046875,
1091.0681024169921,
1068.894476928711,
1061.0595739746093,
1048.5140423583985,
1030.019833984375,
1021.6400866699219,
1014.914428100586,
1012.0101983642578,
1008.9616821289062,
1007.0355267333985
],
"test_losses": [
1278.497021484375,
1241.6509338378905,
1210.9466491699218,
1211.009942626953,
1160.8113220214843,
1111.9551544189453,
1074.8253112792968,
1102.0312622070312,
1043.075909423828,
1020.9971008300781,
1005.1833709716797,
1002.2283630371094,
997.1159881591797,
993.3500823974609,
993.1695037841797
],
"config": {
"epochs": 15,
"batch_size": 32,
"max_learning_rate": 0.001,
"sequence_size": 32,
"shuffle_batches": true,
"shuffle_within_batch": true,
"vae_config": {
"latent_dim": 96,
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 10.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "constant",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2,
"free_bits": 0.15,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"adaptive_weighting": {
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 10.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "constant",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2
},
"regularization": {
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"free_bits": 0.15,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"early_stopping": {
"enabled": false,
"patience": 3,
"min_delta": 0.01,
"triggered": false,
"best_epoch": null
}
},
"final_train_loss": 1007.0355267333985,
"final_test_loss": 993.1695037841797,
"total_epochs": 15,
"best_train_loss": 1007.0355267333985,
"best_test_loss": 993.1695037841797
}