{ "train_losses": [ 0.0003613280423451215, 0.0011523436987772584, 7.812489639036357e-05, 0.0008105469169095159, -6.835948443040252e-05, 0.0010058593470603228, -0.00010742194717749953, -0.00013671873603016138, -0.0021679687779396772, 0.0005371093284338713, 4.882807843387127e-05, -0.002119140699505806, 0.0011035155039280653, 0.0008300781482830644, -0.0007128907018341124, 5.859363591298461e-05, 0.00020507792942225933, -0.002080078236758709, -0.0001171876210719347, -0.0001367187942378223, -0.00033203139901161194, -0.000898437574505806, -0.0005957031971774995, -0.0028808596543967724, 0.0001269530621357262, 0.0009277343051508069, 0.001748046837747097, -0.00327148474752903, -0.0008886720170266926, -0.0009374999790452421, 0.00028320305864326656, -0.0006445314502343535, -0.001103515736758709, -0.001679687760770321, -0.0016015628352761269, 0.0008691406110301614, -0.002128906548023224, 0.0008789062267169356, 0.000732421875, 0.0007812499534338713, -0.001230468973517418, -0.0017773439176380634, 0.0009277343051508069, -0.002490234561264515, -0.00019531260477378964, -0.0016992189921438694, 0.00021484363242052495, -0.00030273443553596735, -0.00018554690177552402, -0.0010156250791624188, -0.0002148438652511686, -0.00023437506752088666, 6.835925159975886e-05, 0.0003124999348074198, -0.0009277344215661287, -0.000859375053551048, 0.000849609321448952, -3.9062462747097015e-05, -0.0006054687546566129, -0.0015429689083248377, -0.0008496094960719347, -0.0037011723034083843, -3.9062550058588386e-05, 0.0005078123649582267, 0.00014648429350927472, -0.0004101564409211278, -0.0008300781482830644, -0.0011914062779396772, -0.001718750107102096, 0.0001269530621357262, -8.789071580395103e-05, 0.00041992179467342794, -0.0028417969588190317, 0.0008789062267169356, 0.0008593749371357262, 0.0001855467853602022, -0.0018066407646983862, -0.0006738282972946763, 0.00026367176906205714, -0.0031542968936264515, -0.0021386719308793545, -0.0013183595146983862, 0.0006738281226716936, -0.0010937501210719347, 0.0004980468656867743, 0.001416015555150807, -0.00017578131519258022, -0.0011425783159211278, 0.0005566406180150807, -0.00024414071231149137, -0.001914062537252903, -0.0026953124906867743, -0.000820312590803951, 0.00038085930282250047, 1.9531144062057137e-05, -0.0012011720100417733, 0.001015624962747097, -0.0006835939711891115, 0.0010058593470603228, 0.00031249987659975886, -0.002109374850988388, -1.9531260477378964e-05, 0.0009082030737772584, 0.0007617187220603228, 0.0008203124161809683, 0.00039062497671693563, -0.0006250001024454832, -0.0010058593470603228, -0.00030273443553596735, 0.0006640624487772584, -0.0010058593470603228, -0.00046874998952262104, -0.00016601569950580597, -0.0010351561941206455, -0.002392577938735485, -0.00025390629889443517, 0.0002636718563735485, 0.0002929687616415322, 0.000283203087747097, 0.00016601562674622983, 0.0002734375011641532, -0.000615234486758709, -0.0010546875419095159, 0.00023437495110556483, -0.00024414071231149137, 0.0006249999860301614, -0.0004199219401925802, -0.0003125000512227416, -0.0006249999860301614, 0.00041992185288108885, -0.002695312723517418, -0.005576171912252903, -0.0020605470053851604, 0.0007910155691206455, -0.0032324218191206455, -0.003095703199505806, 0.0006445312174037099, 0.00048828122089616954, -0.001220703125, -3.906257916241884e-05, -0.0013183595146983862, -0.0004003906506113708, 0.0004101562371943146, -0.0011230469681322575, 0.0005371093284338713, -0.00010742188896983862, -0.005966797471046448, -0.000244140625, -0.0005664062337018549, -0.0023828125558793545, 0.0005078124813735485, -0.002197265625, -0.0010742186568677425, -0.0021386719308793545, 0.00044921872904524207, -0.00036132821696810424, -0.0004589843738358468, -0.0002343750384170562, -0.00020507816225290298, -0.0001367187942378223, 0.0006738281226716936, 0.00048828122089616954, 0.00041992185288108885, -0.0004199218819849193, 0.0005468750023283064, -0.004150390625, 0.0004003905924037099, 9.765624417923391e-05, 0.00020507810404524207, -0.002236328087747097, -0.0004199218819849193, -0.0005371095612645149, 4.8828194849193096e-05, 0.0002441405667923391, -0.002246093936264515, 0.0003320312243886292, -0.00012695312034338713, -0.0020703128539025784, -0.003310547210276127, -0.0010449220426380634, -0.0006250001024454832, 0.00034179684007540345, 0.0008789062267169356, -2.929696347564459e-05, 0.00025390624068677425, 0.00032226560870185494, -0.0021875002421438694, -0.0004980469821020961, 0.0003320312243886292, -0.0008984376909211278, -0.0006738281808793545, -0.0010156251955777407, -0.00011718765017576516, -0.003017578274011612, -0.0013671875931322575 ], "test_losses": [ -0.33519999999999983, -0.1731999999999999, -0.0009999999999998404, -0.07839999999999994, -0.2763999999999999, -0.2005999999999999, -0.07279999999999989, -0.10079999999999996, -0.07419999999999993, 0.00020000000000011453, -0.22099999999999997, -0.15119999999999995, -0.25819999999999993, -0.2673999999999999, -0.2437999999999999, -0.22659999999999997, -0.2699999999999999, -0.24459999999999998, -0.16359999999999997 ], "config": { "training_type": "online_ppo", "environment": "MiniHack-River-Narrow-v0", "total_timesteps": 195, "training_time": 5415.230568885803, "device": "cuda", "ppo_config": { "learning_rate": 0.0003, "n_epochs": 4, "gamma": 0.99, "vf_coef": 0.5, "ent_coef": 0.01, "max_grad_norm": 0.5 }, "exploration_config": { "use_curiosity": false, "curiosity_dyn": false, "curiosity_skill_entropy": false, "curiosity_skill_transition_novelty": false, "curiosity_dyn_coef": 0.03, "curiosity_hdp_coef": 0.2, "curiosity_stn_coef": 0.05, "use_rnd": true, "rnd_lr": 0.001, "rnd_coef": 0.002 }, "model_sources": { "vae_repo_id": null, "hmm_repo_id": null } }, "final_train_loss": -0.0013671875931322575, "final_test_loss": -0.16359999999999997, "total_epochs": 195, "best_train_loss": -0.005966797471046448, "best_test_loss": -0.33519999999999983 }