Second Push

Browse files

Files changed (3) hide show

config.json +1 -1
configuration.yaml +2 -2
run_logs/timers.json +13 -348

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 5000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 20000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 5000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 20000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": null, "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -45,7 +45,7 @@ behaviors:
     self_play: null
     behavioral_cloning: null
 env_settings:
-  env_path: ./training-envs-executables/linux/SnowballTarget/SnowballTarget
   env_args: null
   base_port: 5005
   num_envs: 1
@@ -69,7 +69,7 @@ checkpoint_settings:
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
-  resume: false
   force: false
   train_model: false
   inference: false

     self_play: null
     behavioral_cloning: null
 env_settings:
+  env_path: null
   env_args: null
   base_port: 5005
   num_envs: 1
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
+  resume: true
   force: false
   train_model: false
   inference: false

run_logs/timers.json CHANGED Viewed

@@ -1,375 +1,40 @@
 {
     "name": "root",
-    "gauges": {
-        "SnowballTarget.Policy.Entropy.mean": {
-            "value": 2.753169059753418,
-            "min": 2.753169059753418,
-            "max": 2.8581490516662598,
-            "count": 2
-        },
-        "SnowballTarget.Policy.Entropy.sum": {
-            "value": 28407.19921875,
-            "min": 28407.19921875,
-            "max": 29238.865234375,
-            "count": 2
-        },
-        "SnowballTarget.Step.mean": {
-            "value": 19992.0,
-            "min": 9952.0,
-            "max": 19992.0,
-            "count": 2
-        },
-        "SnowballTarget.Step.sum": {
-            "value": 19992.0,
-            "min": 9952.0,
-            "max": 19992.0,
-            "count": 2
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 1.2926335334777832,
-            "min": 0.22984644770622253,
-            "max": 1.2926335334777832,
-            "count": 2
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 264.9898681640625,
-            "min": 44.5902099609375,
-            "max": 264.9898681640625,
-            "count": 2
-        },
-        "SnowballTarget.Environment.EpisodeLength.mean": {
-            "value": 199.0,
-            "min": 199.0,
-            "max": 199.0,
-            "count": 2
-        },
-        "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 10945.0,
-            "min": 8756.0,
-            "max": 10945.0,
-            "count": 2
-        },
-        "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.06690262798873328,
-            "min": 0.06681513686629949,
-            "max": 0.06690262798873328,
-            "count": 2
-        },
-        "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.33451313994366644,
-            "min": 0.26726054746519795,
-            "max": 0.33451313994366644,
-            "count": 2
-        },
-        "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.1909063190513966,
-            "min": 0.14033411378634397,
-            "max": 0.1909063190513966,
-            "count": 2
-        },
-        "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.9545315952569831,
-            "min": 0.5613364551453759,
-            "max": 0.9545315952569831,
-            "count": 2
-        },
-        "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 7.032007656e-05,
-            "min": 7.032007656e-05,
-            "max": 0.00021882002706000002,
-            "count": 2
-        },
-        "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 0.0003516003828,
-            "min": 0.0003516003828,
-            "max": 0.0008752801082400001,
-            "count": 2
-        },
-        "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.12344000000000002,
-            "min": 0.12344000000000002,
-            "max": 0.17294,
-            "count": 2
-        },
-        "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.6172000000000001,
-            "min": 0.6172000000000001,
-            "max": 0.69176,
-            "count": 2
-        },
-        "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0011796560000000003,
-            "min": 0.0011796560000000003,
-            "max": 0.003649706,
-            "count": 2
-        },
-        "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.005898280000000001,
-            "min": 0.005898280000000001,
-            "max": 0.014598824,
-            "count": 2
-        },
-        "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 5.8,
-            "min": 3.7045454545454546,
-            "max": 5.8,
-            "count": 2
-        },
-        "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 319.0,
-            "min": 163.0,
-            "max": 319.0,
-            "count": 2
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 5.8,
-            "min": 3.7045454545454546,
-            "max": 5.8,
-            "count": 2
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 319.0,
-            "min": 163.0,
-            "max": 319.0,
-            "count": 2
-        },
-        "SnowballTarget.IsTraining.mean": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 2
-        },
-        "SnowballTarget.IsTraining.sum": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 2
-        }
-    },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1703602852",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1703602902"
     },
-    "total": 50.125385297999856,
     "count": 1,
-    "self": 0.697786748000226,
     "children": {
         "run_training.setup": {
-            "total": 0.050454570999818316,
             "count": 1,
-            "self": 0.050454570999818316
         },
         "TrainerController.start_learning": {
-            "total": 49.37714397899981,
             "count": 1,
-            "self": 0.0787745739996808,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.0169926449998457,
-                    "count": 1,
-                    "self": 3.0169926449998457
-                },
-                "TrainerController.advance": {
-                    "total": 46.19316564600035,
-                    "count": 1871,
-                    "self": 0.028356551004208086,
-                    "children": {
-                        "env_step": {
-                            "total": 46.164809094996144,
-                            "count": 1871,
-                            "self": 29.74730983299537,
-                            "children": {
-                                "SubprocessEnvManager._take_step": {
-                                    "total": 16.387860807994002,
-                                    "count": 1871,
-                                    "self": 0.1524993139955768,
-                                    "children": {
-                                        "TorchPolicy.evaluate": {
-                                            "total": 16.235361493998425,
-                                            "count": 1871,
-                                            "self": 16.235361493998425
-                                        }
-                                    }
-                                },
-                                "workers": {
-                                    "total": 0.029638454006772008,
-                                    "count": 1871,
-                                    "self": 0.0,
-                                    "children": {
-                                        "worker_root": {
-                                            "total": 49.19641676199808,
-                                            "count": 1871,
-                                            "is_parallel": true,
-                                            "self": 26.010392564993026,
-                                            "children": {
-                                                "run_training.setup": {
-                                                    "total": 0.0,
-                                                    "count": 0,
-                                                    "is_parallel": true,
-                                                    "self": 0.0,
-                                                    "children": {
-                                                        "steps_from_proto": {
-                                                            "total": 0.004247718999977224,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.002968661000522843,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0012790579994543805,
-                                                                    "count": 10,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.0012790579994543805
-                                                                }
-                                                            }
-                                                        },
-                                                        "UnityEnvironment.step": {
-                                                            "total": 0.038339288999850396,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0006473079999977926,
-                                                            "children": {
-                                                                "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0004000009998890164,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.0004000009998890164
-                                                                },
-                                                                "communicator.exchange": {
-                                                                    "total": 0.035240495999914856,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.035240495999914856
-                                                                },
-                                                                "steps_from_proto": {
-                                                                    "total": 0.002051484000048731,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.00038150400041558896,
-                                                                    "children": {
-                                                                        "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0016699799996331421,
-                                                                            "count": 10,
-                                                                            "is_parallel": true,
-                                                                            "self": 0.0016699799996331421
-                                                                        }
-                                                                    }
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                },
-                                                "UnityEnvironment.step": {
-                                                    "total": 23.186024197005054,
-                                                    "count": 1870,
-                                                    "is_parallel": true,
-                                                    "self": 1.0734497650196317,
-                                                    "children": {
-                                                        "UnityEnvironment._generate_step_input": {
-                                                            "total": 0.5612565489891495,
-                                                            "count": 1870,
-                                                            "is_parallel": true,
-                                                            "self": 0.5612565489891495
-                                                        },
-                                                        "communicator.exchange": {
-                                                            "total": 18.12054548700098,
-                                                            "count": 1870,
-                                                            "is_parallel": true,
-                                                            "self": 18.12054548700098
-                                                        },
-                                                        "steps_from_proto": {
-                                                            "total": 3.430772395995291,
-                                                            "count": 1870,
-                                                            "is_parallel": true,
-                                                            "self": 0.6510793549909977,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 2.7796930410042933,
-                                                                    "count": 18700,
-                                                                    "is_parallel": true,
-                                                                    "self": 2.7796930410042933
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
-                },
-                "trainer_threads": {
-                    "total": 0.00023758199995427276,
                     "count": 1,
-                    "self": 0.00023758199995427276,
-                    "children": {
-                        "thread_root": {
-                            "total": 0.0,
-                            "count": 0,
-                            "is_parallel": true,
-                            "self": 0.0,
-                            "children": {
-                                "trainer_advance": {
-                                    "total": 45.66180945898827,
-                                    "count": 68162,
-                                    "is_parallel": true,
-                                    "self": 1.3704156789815443,
-                                    "children": {
-                                        "process_trajectory": {
-                                            "total": 25.389689409007133,
-                                            "count": 68162,
-                                            "is_parallel": true,
-                                            "self": 24.697163631007015,
-                                            "children": {
-                                                "RLTrainer._checkpoint": {
-                                                    "total": 0.6925257780001175,
-                                                    "count": 4,
-                                                    "is_parallel": true,
-                                                    "self": 0.6925257780001175
-                                                }
-                                            }
-                                        },
-                                        "_update_policy": {
-                                            "total": 18.901704370999596,
-                                            "count": 9,
-                                            "is_parallel": true,
-                                            "self": 5.487976478997325,
-                                            "children": {
-                                                "TorchPPOOptimizer.update": {
-                                                    "total": 13.413727892002271,
-                                                    "count": 456,
-                                                    "is_parallel": true,
-                                                    "self": 13.413727892002271
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.08797353199997815,
                     "count": 1,
-                    "self": 0.000934539000127188,
-                    "children": {
-                        "RLTrainer._checkpoint": {
-                            "total": 0.08703899299985096,
-                            "count": 1,
-                            "self": 0.08703899299985096
-                        }
-                    }
                 }
             }
         }

 {
     "name": "root",
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1703604205",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --run-id=SnowballTarget1 --resume --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1703604266"
     },
+    "total": 60.23162244000014,
     "count": 1,
+    "self": 0.03028296800039243,
     "children": {
         "run_training.setup": {
+            "total": 0.051774862999991456,
             "count": 1,
+            "self": 0.051774862999991456
         },
         "TrainerController.start_learning": {
+            "total": 60.14956460899975,
             "count": 1,
+            "self": 0.00011823599925264716,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 60.14940587700039,
                     "count": 1,
+                    "self": 60.14940587700039
                 },
                 "TrainerController._save_models": {
+                    "total": 4.049600011057919e-05,
                     "count": 1,
+                    "self": 4.049600011057919e-05
                 }
             }
         }