poca-SoccerTwos / run_logs /timers.json
Brain33's picture
First Push
69e80e0 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.438185214996338,
"min": 1.2871428728103638,
"max": 3.295762777328491,
"count": 5000
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 29546.078125,
"min": 18158.86328125,
"max": 128507.140625,
"count": 5000
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 80.08333333333333,
"min": 42.663716814159294,
"max": 999.0,
"count": 5000
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19220.0,
"min": 5000.0,
"max": 29028.0,
"count": 5000
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1725.4868357549199,
"min": 1193.015162420967,
"max": 1786.8978130593764,
"count": 4983
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 207058.42029059038,
"min": 2386.030324841934,
"max": 369536.6967138476,
"count": 4983
},
"SoccerTwos.Step.mean": {
"value": 49999983.0,
"min": 9530.0,
"max": 49999983.0,
"count": 5000
},
"SoccerTwos.Step.sum": {
"value": 49999983.0,
"min": 9530.0,
"max": 49999983.0,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.06711877137422562,
"min": -0.13952656090259552,
"max": 0.18732668459415436,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -8.121371269226074,
"min": -26.649574279785156,
"max": 26.909523010253906,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.06701740622520447,
"min": -0.1348048895597458,
"max": 0.19345541298389435,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -8.109106063842773,
"min": -25.696334838867188,
"max": 28.63368797302246,
"count": 5000
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 5000
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.022000001481741912,
"min": -0.5714285714285714,
"max": 0.4471384584903717,
"count": 5000
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -2.6620001792907715,
"min": -77.37279975414276,
"max": 56.36819976568222,
"count": 5000
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.022000001481741912,
"min": -0.5714285714285714,
"max": 0.4471384584903717,
"count": 5000
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -2.6620001792907715,
"min": -77.37279975414276,
"max": 56.36819976568222,
"count": 5000
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 5000
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 5000
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.018539122284467642,
"min": 0.010676135318014228,
"max": 0.026691932663864767,
"count": 2422
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.018539122284467642,
"min": 0.010676135318014228,
"max": 0.026691932663864767,
"count": 2422
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.07924022773901622,
"min": 7.781588449991734e-06,
"max": 0.11845265949765842,
"count": 2422
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.07924022773901622,
"min": 7.781588449991734e-06,
"max": 0.11845265949765842,
"count": 2422
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.08009959459304809,
"min": 7.447628892502204e-06,
"max": 0.12023574585715929,
"count": 2422
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.08009959459304809,
"min": 7.447628892502204e-06,
"max": 0.12023574585715929,
"count": 2422
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 2422
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 2422
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 2422
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 2422
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 2422
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 2422
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1754278794",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/bolin/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.7.1+cu126",
"numpy_version": "1.23.5",
"end_time_seconds": "1754337377"
},
"total": 58583.416624648,
"count": 1,
"self": 0.1668565660074819,
"children": {
"run_training.setup": {
"total": 0.015344877000188717,
"count": 1,
"self": 0.015344877000188717
},
"TrainerController.start_learning": {
"total": 58583.234423204995,
"count": 1,
"self": 28.006689679357805,
"children": {
"TrainerController._reset_env": {
"total": 3.7130218009770033,
"count": 250,
"self": 3.7130218009770033
},
"TrainerController.advance": {
"total": 58551.44855011267,
"count": 3427750,
"self": 26.388956220180262,
"children": {
"env_step": {
"total": 23389.66532693994,
"count": 3427750,
"self": 19475.559716328786,
"children": {
"SubprocessEnvManager._take_step": {
"total": 3896.89595637029,
"count": 3427750,
"self": 182.23068291639538,
"children": {
"TorchPolicy.evaluate": {
"total": 3714.6652734538948,
"count": 6284314,
"self": 3714.6652734538948
}
}
},
"workers": {
"total": 17.20965424086353,
"count": 3427750,
"self": 0.0,
"children": {
"worker_root": {
"total": 58544.79750145348,
"count": 3427750,
"is_parallel": true,
"self": 42551.46606135835,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0014544330001626804,
"count": 2,
"is_parallel": true,
"self": 0.00036373899956743116,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0010906940005952492,
"count": 8,
"is_parallel": true,
"self": 0.0010906940005952492
}
}
},
"UnityEnvironment.step": {
"total": 0.012421765999988565,
"count": 1,
"is_parallel": true,
"self": 0.0003036180000890454,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0002772789998743974,
"count": 1,
"is_parallel": true,
"self": 0.0002772789998743974
},
"communicator.exchange": {
"total": 0.01087160400038556,
"count": 1,
"is_parallel": true,
"self": 0.01087160400038556
},
"steps_from_proto": {
"total": 0.000969264999639563,
"count": 2,
"is_parallel": true,
"self": 0.00022828999999546795,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0007409749996440951,
"count": 8,
"is_parallel": true,
"self": 0.0007409749996440951
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 15993.118884885997,
"count": 3427749,
"is_parallel": true,
"self": 900.4193676668183,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 612.4480266295209,
"count": 3427749,
"is_parallel": true,
"self": 612.4480266295209
},
"communicator.exchange": {
"total": 11950.058678117999,
"count": 3427749,
"is_parallel": true,
"self": 11950.058678117999
},
"steps_from_proto": {
"total": 2530.1928124716583,
"count": 6855498,
"is_parallel": true,
"self": 435.93581838643513,
"children": {
"_process_rank_one_or_two_observation": {
"total": 2094.256994085223,
"count": 27421992,
"is_parallel": true,
"self": 2094.256994085223
}
}
}
}
},
"steps_from_proto": {
"total": 0.21255520914064618,
"count": 498,
"is_parallel": true,
"self": 0.03900427415192098,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.1735509349887252,
"count": 1992,
"is_parallel": true,
"self": 0.1735509349887252
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 35135.39426695255,
"count": 3427750,
"self": 266.1699697615768,
"children": {
"process_trajectory": {
"total": 5083.07728814891,
"count": 3427750,
"self": 5076.223328915879,
"children": {
"RLTrainer._checkpoint": {
"total": 6.853959233030309,
"count": 100,
"self": 6.853959233030309
}
}
},
"_update_policy": {
"total": 29786.147009042066,
"count": 2422,
"self": 2878.9186776652605,
"children": {
"TorchPOCAOptimizer.update": {
"total": 26907.228331376806,
"count": 72672,
"self": 26907.228331376806
}
}
}
}
}
}
},
"trainer_threads": {
"total": 3.609966370277107e-07,
"count": 1,
"self": 3.609966370277107e-07
},
"TrainerController._save_models": {
"total": 0.06616125099390047,
"count": 1,
"self": 0.0009089379891520366,
"children": {
"RLTrainer._checkpoint": {
"total": 0.06525231300474843,
"count": 1,
"self": 0.06525231300474843
}
}
}
}
}
}
}