First Push

Browse files

Files changed (5) hide show

README.md +4 -4
config.json +1 -1
configuration.yaml +24 -11
run_logs/timers.json +15 -345
run_logs/training_status.json +0 -58

README.md CHANGED Viewed

@@ -1,14 +1,14 @@
 ---
 library_name: ml-agents
 tags:
-- SnowballTarget
 - deep-reinforcement-learning
 - reinforcement-learning
-- ML-Agents-SnowballTarget
 ---
-  # **ppo** Agent playing **SnowballTarget**
-  This is a trained model of a **ppo** agent playing **SnowballTarget**
   using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)

 ---
 library_name: ml-agents
 tags:
+- Pyramids
 - deep-reinforcement-learning
 - reinforcement-learning
+- ML-Agents-Pyramids
 ---
+  # **ppo** Agent playing **Pyramids**
+  This is a trained model of a **ppo** agent playing **Pyramids**
   using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 64, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 1000000, "time_horizon": 128, "summary_freq": 30000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/Pyramids/Pyramids", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Pyramids Training", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -1,12 +1,12 @@
 default_settings: null
 behaviors:
-  SnowballTarget:
     trainer_type: ppo
     hyperparameters:
       batch_size: 128
       buffer_size: 2048
       learning_rate: 0.0003
-      beta: 0.005
       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
@@ -14,10 +14,10 @@ behaviors:
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
-    checkpoint_interval: 50000
     network_settings:
       normalize: false
-      hidden_units: 256
       num_layers: 2
       vis_encode_type: simple
       memory: null
@@ -35,17 +35,30 @@ behaviors:
           memory: null
           goal_conditioning_type: hyper
           deterministic: false
     init_path: null
-    keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 200000
-    time_horizon: 64
-    summary_freq: 10000
-    threaded: true
     self_play: null
     behavioral_cloning: null
 env_settings:
-  env_path: ./training-envs-executables/linux/SnowballTarget/SnowballTarget
   env_args: null
   base_port: 5005
   num_envs: 1
@@ -66,7 +79,7 @@ engine_settings:
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
-  run_id: SnowballTarget1
   initialize_from: null
   load_model: false
   resume: false

 default_settings: null
 behaviors:
+  Pyramids:
     trainer_type: ppo
     hyperparameters:
       batch_size: 128
       buffer_size: 2048
       learning_rate: 0.0003
+      beta: 0.01
       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
+    checkpoint_interval: 500000
     network_settings:
       normalize: false
+      hidden_units: 512
       num_layers: 2
       vis_encode_type: simple
       memory: null
           memory: null
           goal_conditioning_type: hyper
           deterministic: false
+      rnd:
+        gamma: 0.99
+        strength: 0.01
+        network_settings:
+          normalize: false
+          hidden_units: 64
+          num_layers: 3
+          vis_encode_type: simple
+          memory: null
+          goal_conditioning_type: hyper
+          deterministic: false
+        learning_rate: 0.0001
+        encoding_size: null
     init_path: null
+    keep_checkpoints: 5
     even_checkpoints: false
+    max_steps: 1000000
+    time_horizon: 128
+    summary_freq: 30000
+    threaded: false
     self_play: null
     behavioral_cloning: null
 env_settings:
+  env_path: ./training-envs-executables/linux/Pyramids/Pyramids
   env_args: null
   base_port: 5005
   num_envs: 1
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
+  run_id: Pyramids Training
   initialize_from: null
   load_model: false
   resume: false

run_logs/timers.json CHANGED Viewed

@@ -1,375 +1,45 @@
 {
     "name": "root",
-    "gauges": {
-        "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.9914730787277222,
-            "min": 0.9914730787277222,
-            "max": 2.873957633972168,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Entropy.sum": {
-            "value": 9499.3037109375,
-            "min": 9499.3037109375,
-            "max": 29495.427734375,
-            "count": 20
-        },
-        "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
-        },
-        "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 12.96503734588623,
-            "min": 0.3656828999519348,
-            "max": 12.96503734588623,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2528.182373046875,
-            "min": 70.9424819946289,
-            "max": 2602.71875,
-            "count": 20
-        },
-        "SnowballTarget.Environment.EpisodeLength.mean": {
-            "value": 199.0,
-            "min": 199.0,
-            "max": 199.0,
-            "count": 20
-        },
-        "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 8756.0,
-            "min": 8756.0,
-            "max": 10945.0,
-            "count": 20
-        },
-        "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.06374345075849253,
-            "min": 0.06169963288562476,
-            "max": 0.07582122400430415,
-            "count": 20
-        },
-        "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2549738030339701,
-            "min": 0.24679853154249903,
-            "max": 0.36523728684508516,
-            "count": 20
-        },
-        "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.20116959263881046,
-            "min": 0.09848128757256941,
-            "max": 0.2898164811525859,
-            "count": 20
-        },
-        "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.8046783705552418,
-            "min": 0.39392515029027764,
-            "max": 1.3678632022119035,
-            "count": 20
-        },
-        "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 8.082097306000005e-06,
-            "min": 8.082097306000005e-06,
-            "max": 0.000291882002706,
-            "count": 20
-        },
-        "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 3.232838922400002e-05,
-            "min": 3.232838922400002e-05,
-            "max": 0.00138516003828,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.10269400000000001,
-            "min": 0.10269400000000001,
-            "max": 0.19729400000000002,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.41077600000000003,
-            "min": 0.41077600000000003,
-            "max": 0.96172,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0001444306000000001,
-            "min": 0.0001444306000000001,
-            "max": 0.0048649706,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0005777224000000004,
-            "min": 0.0005777224000000004,
-            "max": 0.023089828,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 25.886363636363637,
-            "min": 2.8636363636363638,
-            "max": 25.886363636363637,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1139.0,
-            "min": 126.0,
-            "max": 1393.0,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 25.886363636363637,
-            "min": 2.8636363636363638,
-            "max": 25.886363636363637,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1139.0,
-            "min": 126.0,
-            "max": 1393.0,
-            "count": 20
-        },
-        "SnowballTarget.IsTraining.mean": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 20
-        },
-        "SnowballTarget.IsTraining.sum": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 20
-        }
-    },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1707941657",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.2.0+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1707942274"
     },
-    "total": 616.9848276049999,
     "count": 1,
-    "self": 0.5305121579997376,
     "children": {
         "run_training.setup": {
-            "total": 0.07121669399998609,
             "count": 1,
-            "self": 0.07121669399998609
         },
         "TrainerController.start_learning": {
-            "total": 616.3830987530001,
             "count": 1,
-            "self": 0.9253966029928051,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 4.86483831399994,
                     "count": 1,
-                    "self": 4.86483831399994
-                },
-                "TrainerController.advance": {
-                    "total": 610.4914103100073,
-                    "count": 18203,
-                    "self": 0.44134618003295145,
-                    "children": {
-                        "env_step": {
-                            "total": 610.0500641299743,
-                            "count": 18203,
-                            "self": 469.4286792179771,
-                            "children": {
-                                "SubprocessEnvManager._take_step": {
-                                    "total": 140.18064394098474,
-                                    "count": 18203,
-                                    "self": 2.7716976129713657,
-                                    "children": {
-                                        "TorchPolicy.evaluate": {
-                                            "total": 137.40894632801337,
-                                            "count": 18203,
-                                            "self": 137.40894632801337
-                                        }
-                                    }
-                                },
-                                "workers": {
-                                    "total": 0.4407409710124739,
-                                    "count": 18203,
-                                    "self": 0.0,
-                                    "children": {
-                                        "worker_root": {
-                                            "total": 614.3191371800239,
-                                            "count": 18203,
-                                            "is_parallel": true,
-                                            "self": 289.1690472830177,
-                                            "children": {
-                                                "run_training.setup": {
-                                                    "total": 0.0,
-                                                    "count": 0,
-                                                    "is_parallel": true,
-                                                    "self": 0.0,
-                                                    "children": {
-                                                        "steps_from_proto": {
-                                                            "total": 0.007789372000047479,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0055618820002791836,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.002227489999768295,
-                                                                    "count": 10,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.002227489999768295
-                                                                }
-                                                            }
-                                                        },
-                                                        "UnityEnvironment.step": {
-                                                            "total": 0.05753250100008245,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0026428850000002058,
-                                                            "children": {
-                                                                "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0005031310000731537,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.0005031310000731537
-                                                                },
-                                                                "communicator.exchange": {
-                                                                    "total": 0.04731931200001327,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.04731931200001327
-                                                                },
-                                                                "steps_from_proto": {
-                                                                    "total": 0.007067172999995819,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.0005673890000252868,
-                                                                    "children": {
-                                                                        "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.006499783999970532,
-                                                                            "count": 10,
-                                                                            "is_parallel": true,
-                                                                            "self": 0.006499783999970532
-                                                                        }
-                                                                    }
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                },
-                                                "UnityEnvironment.step": {
-                                                    "total": 325.1500898970062,
-                                                    "count": 18202,
-                                                    "is_parallel": true,
-                                                    "self": 15.278682513998433,
-                                                    "children": {
-                                                        "UnityEnvironment._generate_step_input": {
-                                                            "total": 7.886213973984923,
-                                                            "count": 18202,
-                                                            "is_parallel": true,
-                                                            "self": 7.886213973984923
-                                                        },
-                                                        "communicator.exchange": {
-                                                            "total": 255.72345804001293,
-                                                            "count": 18202,
-                                                            "is_parallel": true,
-                                                            "self": 255.72345804001293
-                                                        },
-                                                        "steps_from_proto": {
-                                                            "total": 46.2617353690099,
-                                                            "count": 18202,
-                                                            "is_parallel": true,
-                                                            "self": 9.199899673961909,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 37.06183569504799,
-                                                                    "count": 182020,
-                                                                    "is_parallel": true,
-                                                                    "self": 37.06183569504799
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "trainer_threads": {
-                    "total": 0.00013422500001070148,
                     "count": 1,
-                    "self": 0.00013422500001070148,
-                    "children": {
-                        "thread_root": {
-                            "total": 0.0,
-                            "count": 0,
-                            "is_parallel": true,
-                            "self": 0.0,
-                            "children": {
-                                "trainer_advance": {
-                                    "total": 603.3576001671316,
-                                    "count": 787096,
-                                    "is_parallel": true,
-                                    "self": 18.87754923110151,
-                                    "children": {
-                                        "process_trajectory": {
-                                            "total": 321.9403706180301,
-                                            "count": 787096,
-                                            "is_parallel": true,
-                                            "self": 321.37840758902985,
-                                            "children": {
-                                                "RLTrainer._checkpoint": {
-                                                    "total": 0.5619630290002533,
-                                                    "count": 4,
-                                                    "is_parallel": true,
-                                                    "self": 0.5619630290002533
-                                                }
-                                            }
-                                        },
-                                        "_update_policy": {
-                                            "total": 262.539680318,
-                                            "count": 90,
-                                            "is_parallel": true,
-                                            "self": 68.92569046499761,
-                                            "children": {
-                                                "TorchPPOOptimizer.update": {
-                                                    "total": 193.6139898530024,
-                                                    "count": 4587,
-                                                    "is_parallel": true,
-                                                    "self": 193.6139898530024
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.10131930100010322,
                     "count": 1,
-                    "self": 0.0012558180001178698,
-                    "children": {
-                        "RLTrainer._checkpoint": {
-                            "total": 0.10006348299998535,
-                            "count": 1,
-                            "self": 0.10006348299998535
-                        }
-                    }
                 }
             }
         }

 {
     "name": "root",
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1707941582",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.2.0+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1707941582"
     },
+    "total": 0.1519914749999316,
     "count": 1,
+    "self": 0.016260902999988502,
     "children": {
         "run_training.setup": {
+            "total": 0.07344121500000256,
             "count": 1,
+            "self": 0.07344121500000256
         },
         "TrainerController.start_learning": {
+            "total": 0.06228935699994054,
             "count": 1,
+            "self": 0.0007777309999710269,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 0.06149067399996966,
                     "count": 1,
+                    "self": 0.06149067399996966
                 },
                 "trainer_threads": {
+                    "total": 1.2639999340535724e-06,
                     "count": 1,
+                    "self": 1.2639999340535724e-06
                 },
                 "TrainerController._save_models": {
+                    "total": 1.9688000065798406e-05,
                     "count": 1,
+                    "self": 1.9688000065798406e-05
                 }
             }
         }

run_logs/training_status.json CHANGED Viewed

@@ -1,62 +1,4 @@
 {
-    "SnowballTarget": {
-        "checkpoints": [
-            {
-                "steps": 49936,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 12.545454545454545,
-                "creation_time": 1707941813.3585904,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
-                ]
-            },
-            {
-                "steps": 99960,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 20.272727272727273,
-                "creation_time": 1707941968.323758,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
-                ]
-            },
-            {
-                "steps": 149984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 24.727272727272727,
-                "creation_time": 1707942119.6343586,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
-                ]
-            },
-            {
-                "steps": 199984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 25.272727272727273,
-                "creation_time": 1707942273.4143367,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
-                ]
-            },
-            {
-                "steps": 200112,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 25.272727272727273,
-                "creation_time": 1707942273.5439253,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
-                ]
-            }
-        ],
-        "final_checkpoint": {
-            "steps": 200112,
-            "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 25.272727272727273,
-            "creation_time": 1707942273.5439253,
-            "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
-            ]
-        }
-    },
     "metadata": {
         "stats_format_version": "0.3.0",
         "mlagents_version": "1.1.0.dev0",

 {
     "metadata": {
         "stats_format_version": "0.3.0",
         "mlagents_version": "1.1.0.dev0",