nethack-vae / training_data.json
CatkinChen's picture
Add training data
09cc336 verified
raw
history blame
2.31 kB
{
"train_losses": [
2111.7611865234376,
1212.1435998535155,
1171.34529296875,
1136.2398962402344,
1109.2583923339844,
1089.3295330810547,
1077.6256915283202,
1068.5979656982422,
1046.4885858154296,
1034.4147955322267,
1022.2338330078124,
1016.7246740722657,
1011.3862927246093,
1008.4382983398438,
1007.1079608154297
],
"test_losses": [
1288.1074951171875,
1239.0845153808593,
1217.204327392578,
1174.8377197265625,
1152.8598571777343,
1145.8320037841797,
1117.911279296875,
1115.5450775146485,
1055.7722442626953,
1037.2113189697266,
1013.2753051757812,
1005.9470703125,
1003.9286956787109,
999.6026977539062,
998.8647766113281
],
"config": {
"epochs": 15,
"batch_size": 32,
"max_learning_rate": 0.001,
"sequence_size": 32,
"shuffle_batches": true,
"shuffle_within_batch": true,
"vae_config": {
"latent_dim": 96,
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 10.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "constant",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2,
"free_bits": 0.15,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"adaptive_weighting": {
"initial_mi_beta": 1.0,
"final_mi_beta": 1.0,
"mi_beta_shape": "constant",
"initial_tc_beta": 10.0,
"final_tc_beta": 10.0,
"tc_beta_shape": "constant",
"initial_dw_beta": 0.2,
"final_dw_beta": 1.0,
"dw_beta_shape": "custom",
"warmup_epoch_ratio": 0.2
},
"regularization": {
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"free_bits": 0.15,
"focal_loss_alpha": 0.5,
"focal_loss_gamma": 2.0
},
"early_stopping": {
"enabled": false,
"patience": 3,
"min_delta": 0.01,
"triggered": false,
"best_epoch": null
}
},
"final_train_loss": 1007.1079608154297,
"final_test_loss": 998.8647766113281,
"total_epochs": 15,
"best_train_loss": 1007.1079608154297,
"best_test_loss": 998.8647766113281
}