Trained Model v1.3

Browse files

Files changed (10) hide show

CubeChaseAgent.onnx +1 -1
CubeChaseAgent/CubeChaseAgent-121672.onnx +3 -0
CubeChaseAgent/CubeChaseAgent-121672.pt +3 -0
CubeChaseAgent/checkpoint.pt +2 -2
CubeChaseAgent/events.out.tfevents.1691414760.9d7388201558.1997.0 +3 -0
config.json +1 -1
configuration.yaml +1 -1
run_logs/Player-0.log +20 -21
run_logs/timers.json +162 -162
run_logs/training_status.json +8 -8

CubeChaseAgent.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:23a6f9e48182387337673e7c8d312ef50b43ea15c2dcd0e75f2df7e0bbc8ca27
 size 74450

 version https://git-lfs.github.com/spec/v1
+oid sha256:132123c61c6642ea47f2aec25937dd215b1624220c63b7e0c525b0fd1f0dccf0
 size 74450

CubeChaseAgent/CubeChaseAgent-121672.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:132123c61c6642ea47f2aec25937dd215b1624220c63b7e0c525b0fd1f0dccf0
+size 74450

CubeChaseAgent/CubeChaseAgent-121672.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:59b6b37974677128fc9ffedaa2ca02b7ca0ad5e65835ef40847eada6e3d0ffa2
+size 443355

CubeChaseAgent/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:416853c459b02cb0ac2792db719f9d9b2713dc40c95bec120a66edf2f803ee79
-size 443995

 version https://git-lfs.github.com/spec/v1
+oid sha256:59b6b37974677128fc9ffedaa2ca02b7ca0ad5e65835ef40847eada6e3d0ffa2
+size 443355

CubeChaseAgent/events.out.tfevents.1691414760.9d7388201558.1997.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26ead0fe12af4b67b7ad32d685d0eaae11f5629a7a82b2cd17f967dc9236ed7a
+size 65797

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"CubeChaseAgent": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 10, "buffer_size": 100, "learning_rate": 0.0003, "beta": 0.0005, "epsilon": 0.2, "lambd": 0.99, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "constant", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 500000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/CubeChase/CubeChase.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "CubeChasev1.2", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"CubeChaseAgent": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 10, "buffer_size": 100, "learning_rate": 0.0003, "beta": 0.0005, "epsilon": 0.2, "lambd": 0.99, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "constant", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 500000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/CubeChase/CubeChase.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "CubeChasev1.3", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -64,7 +64,7 @@ engine_settings:
   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
-  run_id: CubeChasev1.2
   initialize_from: null
   load_model: false
   resume: false

   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
+  run_id: CubeChasev1.3
   initialize_from: null
   load_model: false
   resume: false

run_logs/Player-0.log CHANGED Viewed

@@ -34,7 +34,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.098 seconds
 ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Hidden/Universal Render Pipeline/Sampling shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -74,15 +74,14 @@ ERROR: Shader Universal Render Pipeline/Lit shader is not supported on this GPU
 WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.646957 ms
 requesting resize 84 x 84
-GRPC Exception: Status(StatusCode=Cancelled, Detail="CANCELLED"). Disconnecting from trainer.
 Setting up 1 worker threads for Enlighten.
 Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 972 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.3 MB
@@ -90,12 +89,12 @@ Memory Statistics:
     [ALLOC_TEMP_Loading.AsyncRead]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
-      Peak Allocated Bytes 256 B
       Overflow Count 0
     [ALLOC_TEMP_Loading.PreloadManager]
       Initial Block Size 256.0 KB
       Current Block Size 256.0 KB
-      Peak Allocated Bytes 141.2 KB
       Overflow Count 4
     [ALLOC_TEMP_Background Job.Worker 8]
       Initial Block Size 32.0 KB
@@ -202,18 +201,18 @@ Memory Statistics:
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.2 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 973 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 20.8 MB
       Peak Large allocation bytes 16.0 MB
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [1.0 MB-2.0 MB]: 973 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 1.4 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -240,15 +239,15 @@ Memory Statistics:
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.2 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 972 frames, [64.0 KB-128.0 KB]: 1 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 65.7 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 973 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 36.2 KB
@@ -258,33 +257,33 @@ Memory Statistics:
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.2 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [1.0 MB-2.0 MB]: 972 frames, [4.0 MB-8.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 5.8 MB
       Peak Large allocation bytes 2.5 MB
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [256.0 KB-0.5 MB]: 972 frames, [1.0 MB-2.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
-      Peak Allocated memory 1.0 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TYPETREE] Dual Thread Allocator
   Peak main deferred allocation count 0
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.2 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 973 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.1 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [0-1.0 KB]: 973 frames
       Requested Block Size 2.0 MB
       Peak Block count 0
       Peak Allocated memory 0 B

 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.127 seconds
 ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Hidden/Universal Render Pipeline/Sampling shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 1.082538 ms
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [2.0 KB-4.0 KB]: 731 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.3 MB
     [ALLOC_TEMP_Loading.AsyncRead]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
+      Peak Allocated Bytes 240 B
       Overflow Count 0
     [ALLOC_TEMP_Loading.PreloadManager]
       Initial Block Size 256.0 KB
       Current Block Size 256.0 KB
+      Peak Allocated Bytes 157.5 KB
       Overflow Count 4
     [ALLOC_TEMP_Background Job.Worker 8]
       Initial Block Size 32.0 KB
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.3 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 732 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 21.0 MB
       Peak Large allocation bytes 16.0 MB
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [1.0 MB-2.0 MB]: 732 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 1.5 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.3 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 731 frames, [64.0 KB-128.0 KB]: 1 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 65.7 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 732 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 36.2 KB
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.3 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [1.0 MB-2.0 MB]: 731 frames, [4.0 MB-8.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 5.8 MB
       Peak Large allocation bytes 2.5 MB
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 731 frames, [1.0 MB-2.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
+      Peak Allocated memory 1.6 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TYPETREE] Dual Thread Allocator
   Peak main deferred allocation count 0
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.3 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 732 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.1 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [0-1.0 KB]: 732 frames
       Requested Block Size 2.0 MB
       Peak Block count 0
       Peak Allocated memory 0 B

run_logs/timers.json CHANGED Viewed

@@ -2,213 +2,213 @@
     "name": "root",
     "gauges": {
         "CubeChaseAgent.Policy.Entropy.mean": {
-            "value": 1.3304638862609863,
-            "min": 1.3304638862609863,
-            "max": 1.4406789541244507,
-            "count": 8
         },
         "CubeChaseAgent.Policy.Entropy.sum": {
-            "value": 13371.162109375,
-            "min": 13371.162109375,
-            "max": 14743.5654296875,
-            "count": 8
         },
         "CubeChaseAgent.Environment.EpisodeLength.mean": {
-            "value": 2.8197408536585367,
-            "min": 2.8197408536585367,
-            "max": 12.106159895150721,
-            "count": 8
         },
         "CubeChaseAgent.Environment.EpisodeLength.sum": {
-            "value": 7399.0,
-            "min": 7399.0,
-            "max": 9237.0,
-            "count": 8
         },
         "CubeChaseAgent.Step.mean": {
-            "value": 79997.0,
-            "min": 9990.0,
-            "max": 79997.0,
-            "count": 8
         },
         "CubeChaseAgent.Step.sum": {
-            "value": 79997.0,
-            "min": 9990.0,
-            "max": 79997.0,
-            "count": 8
         },
         "CubeChaseAgent.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 0.9831324219703674,
-            "min": 0.43312692642211914,
-            "max": 0.9832891821861267,
-            "count": 8
         },
         "CubeChaseAgent.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2575.806884765625,
-            "min": 330.042724609375,
-            "max": 2575.806884765625,
-            "count": 8
         },
         "CubeChaseAgent.Environment.CumulativeReward.mean": {
-            "value": 0.9977099236641221,
-            "min": 0.5078740157480315,
-            "max": 0.9992038216560509,
-            "count": 8
         },
         "CubeChaseAgent.Environment.CumulativeReward.sum": {
-            "value": 2614.0,
-            "min": 387.0,
-            "max": 2614.0,
-            "count": 8
         },
         "CubeChaseAgent.Policy.ExtrinsicReward.mean": {
-            "value": 0.9977099236641221,
-            "min": 0.5078740157480315,
-            "max": 0.9992038216560509,
-            "count": 8
         },
         "CubeChaseAgent.Policy.ExtrinsicReward.sum": {
-            "value": 2614.0,
-            "min": 387.0,
-            "max": 2614.0,
-            "count": 8
         },
         "CubeChaseAgent.Losses.PolicyLoss.mean": {
-            "value": 0.2412640100830578,
-            "min": 0.2364040109031282,
-            "max": 0.2443406546307238,
-            "count": 8
         },
         "CubeChaseAgent.Losses.PolicyLoss.sum": {
-            "value": 22.92008095789049,
-            "min": 21.813553494995514,
-            "max": 23.20331698343004,
-            "count": 8
         },
         "CubeChaseAgent.Losses.ValueLoss.mean": {
-            "value": 0.0026035018763841144,
-            "min": 0.0011506950352082983,
-            "max": 0.08874128673615443,
-            "count": 8
         },
         "CubeChaseAgent.Losses.ValueLoss.sum": {
-            "value": 0.24733267825649086,
-            "min": 0.11046672337999663,
-            "max": 7.986715806253899,
-            "count": 8
         },
         "CubeChaseAgent.Policy.LearningRate.mean": {
-            "value": 0.00025501817920447155,
-            "min": 0.00025501817920447155,
-            "max": 0.00029694244768585103,
-            "count": 8
         },
         "CubeChaseAgent.Policy.LearningRate.sum": {
-            "value": 0.0242267270244248,
-            "min": 0.0242267270244248,
-            "max": 0.0270760528746492,
-            "count": 8
         },
         "CubeChaseAgent.Policy.Epsilon.mean": {
-            "value": 0.18500605473684215,
-            "min": 0.18500605473684215,
-            "max": 0.19898081555555558,
-            "count": 8
         },
         "CubeChaseAgent.Policy.Epsilon.sum": {
-            "value": 17.575575200000003,
-            "min": 17.575575200000003,
-            "max": 18.5282962,
-            "count": 8
         },
         "CubeChaseAgent.Policy.Beta.mean": {
             "value": 0.0005000000000000001,
             "min": 0.0005000000000000001,
             "max": 0.0005000000000000001,
-            "count": 8
         },
         "CubeChaseAgent.Policy.Beta.sum": {
-            "value": 0.047500000000000014,
-            "min": 0.04500000000000001,
-            "max": 0.048000000000000015,
-            "count": 8
         },
         "CubeChaseAgent.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 8
         },
         "CubeChaseAgent.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 8
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1691412635",
         "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/ppo/CubeChase.yaml --env=./training-envs-executables/linux/CubeChase/CubeChase.x86_64 --run-id=CubeChasev1.2 --no-graphics --force",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
-        "end_time_seconds": "1691412880"
     },
-    "total": 245.83182224499996,
     "count": 1,
-    "self": 0.4245115729999611,
     "children": {
         "run_training.setup": {
-            "total": 0.04349833100002343,
             "count": 1,
-            "self": 0.04349833100002343
         },
         "TrainerController.start_learning": {
-            "total": 245.36381234099997,
             "count": 1,
-            "self": 0.2728475159973982,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 6.391924240000037,
                     "count": 1,
-                    "self": 6.391924240000037
                 },
                 "TrainerController.advance": {
-                    "total": 238.47294238400252,
-                    "count": 11102,
-                    "self": 0.22291748600707706,
                     "children": {
                         "env_step": {
-                            "total": 46.25549591399539,
-                            "count": 11102,
-                            "self": 44.18142690399924,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 1.9414303580004457,
-                                    "count": 11102,
-                                    "self": 0.2282176760034531,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 1.7132126819969926,
-                                            "count": 1621,
-                                            "self": 1.7132126819969926
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.13263865199570546,
-                                    "count": 11101,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 244.76964477900037,
-                                            "count": 11101,
                                             "is_parallel": true,
-                                            "self": 212.69376319200012,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0012042240000482707,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0002967720000697227,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.000907451999978548,
                                                                     "count": 2,
                                                                     "is_parallel": true,
-                                                                    "self": 0.000907451999978548
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.04441783600003646,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.00019538599997304118,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0011486580000337199,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0011486580000337199
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.04265053000000307,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.04265053000000307
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0004232620000266252,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0001985210000157167,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.00022474100001090846,
                                                                             "count": 2,
                                                                             "is_parallel": true,
-                                                                            "self": 0.00022474100001090846
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 32.075881587000254,
-                                                    "count": 11100,
                                                     "is_parallel": true,
-                                                    "self": 1.7562732710036357,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 1.98411509000357,
-                                                            "count": 11100,
                                                             "is_parallel": true,
-                                                            "self": 1.98411509000357
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 24.525806725998393,
-                                                            "count": 11100,
                                                             "is_parallel": true,
-                                                            "self": 24.525806725998393
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 3.8096864999946547,
-                                                            "count": 11100,
                                                             "is_parallel": true,
-                                                            "self": 1.7021175089816438,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 2.107568991013011,
-                                                                    "count": 22200,
                                                                     "is_parallel": true,
-                                                                    "self": 2.107568991013011
                                                                 }
                                                             }
                                                         }
@@ -307,24 +307,24 @@
                             }
                         },
                         "trainer_advance": {
-                            "total": 191.99452898400006,
-                            "count": 11101,
-                            "self": 0.25941598700370605,
                             "children": {
                                 "process_trajectory": {
-                                    "total": 30.366022278994308,
-                                    "count": 11101,
-                                    "self": 30.366022278994308
                                 },
                                 "_update_policy": {
-                                    "total": 161.36909071800204,
-                                    "count": 763,
-                                    "self": 16.34106925999839,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
-                                            "total": 145.02802145800365,
-                                            "count": 23370,
-                                            "self": 145.02802145800365
                                         }
                                     }
                                 }
@@ -333,19 +333,19 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 1.247000000148546e-06,
                     "count": 1,
-                    "self": 1.247000000148546e-06
                 },
                 "TrainerController._save_models": {
-                    "total": 0.22609695400001328,
                     "count": 1,
-                    "self": 0.0005307090000314929,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.2255662449999818,
                             "count": 1,
-                            "self": 0.2255662449999818
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "CubeChaseAgent.Policy.Entropy.mean": {
+            "value": 1.3624736070632935,
+            "min": 1.3624736070632935,
+            "max": 1.426416277885437,
+            "count": 12
         },
         "CubeChaseAgent.Policy.Entropy.sum": {
+            "value": 13488.48828125,
+            "min": 13350.98828125,
+            "max": 16555.53515625,
+            "count": 12
         },
         "CubeChaseAgent.Environment.EpisodeLength.mean": {
+            "value": 5.258911819887429,
+            "min": 5.258911819887429,
+            "max": 26.4585635359116,
+            "count": 12
         },
         "CubeChaseAgent.Environment.EpisodeLength.sum": {
+            "value": 8409.0,
+            "min": 8409.0,
+            "max": 9599.0,
+            "count": 12
         },
         "CubeChaseAgent.Step.mean": {
+            "value": 119998.0,
+            "min": 9974.0,
+            "max": 119998.0,
+            "count": 12
         },
         "CubeChaseAgent.Step.sum": {
+            "value": 119998.0,
+            "min": 9974.0,
+            "max": 119998.0,
+            "count": 12
         },
         "CubeChaseAgent.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 0.9679732918739319,
+            "min": 0.15101228654384613,
+            "max": 0.9679732918739319,
+            "count": 12
         },
         "CubeChaseAgent.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 1546.8212890625,
+            "min": 55.119483947753906,
+            "max": 1546.8212890625,
+            "count": 12
         },
         "CubeChaseAgent.Environment.CumulativeReward.mean": {
+            "value": 0.9949937421777222,
+            "min": 0.20498614958448755,
+            "max": 0.9949937421777222,
+            "count": 12
         },
         "CubeChaseAgent.Environment.CumulativeReward.sum": {
+            "value": 1590.0,
+            "min": 74.0,
+            "max": 1590.0,
+            "count": 12
         },
         "CubeChaseAgent.Policy.ExtrinsicReward.mean": {
+            "value": 0.9949937421777222,
+            "min": 0.20498614958448755,
+            "max": 0.9949937421777222,
+            "count": 12
         },
         "CubeChaseAgent.Policy.ExtrinsicReward.sum": {
+            "value": 1590.0,
+            "min": 74.0,
+            "max": 1590.0,
+            "count": 12
         },
         "CubeChaseAgent.Losses.PolicyLoss.mean": {
+            "value": 0.24009240636568133,
+            "min": 0.2346602955969273,
+            "max": 0.24759637916873814,
+            "count": 12
         },
         "CubeChaseAgent.Losses.PolicyLoss.sum": {
+            "value": 22.088501385642683,
+            "min": 19.66620900576534,
+            "max": 22.539351797162563,
+            "count": 12
         },
         "CubeChaseAgent.Losses.ValueLoss.mean": {
+            "value": 0.004534491502782299,
+            "min": 0.004534491502782299,
+            "max": 0.09943730601449394,
+            "count": 12
         },
         "CubeChaseAgent.Losses.ValueLoss.sum": {
+            "value": 0.41717321825597153,
+            "min": 0.41717321825597153,
+            "max": 8.84992023528996,
+            "count": 12
         },
         "CubeChaseAgent.Policy.LearningRate.mean": {
+            "value": 0.00023097265126999355,
+            "min": 0.00023097265126999355,
+            "max": 0.00029695498620019013,
+            "count": 12
         },
         "CubeChaseAgent.Policy.LearningRate.sum": {
+            "value": 0.021249483916839406,
+            "min": 0.021249483916839406,
+            "max": 0.025365034644988595,
+            "count": 12
         },
         "CubeChaseAgent.Policy.Epsilon.mean": {
+            "value": 0.17699087608695654,
+            "min": 0.17699087608695654,
+            "max": 0.1989849950617284,
+            "count": 12
         },
         "CubeChaseAgent.Policy.Epsilon.sum": {
+            "value": 16.283160600000002,
+            "min": 16.1177846,
+            "max": 17.3550114,
+            "count": 12
         },
         "CubeChaseAgent.Policy.Beta.mean": {
             "value": 0.0005000000000000001,
             "min": 0.0005000000000000001,
             "max": 0.0005000000000000001,
+            "count": 12
         },
         "CubeChaseAgent.Policy.Beta.sum": {
+            "value": 0.04600000000000001,
+            "min": 0.04050000000000001,
+            "max": 0.046500000000000014,
+            "count": 12
         },
         "CubeChaseAgent.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 12
         },
         "CubeChaseAgent.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 12
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1691414757",
         "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/ppo/CubeChase.yaml --env=./training-envs-executables/linux/CubeChase/CubeChase.x86_64 --run-id=CubeChasev1.3 --no-graphics --force",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
+        "end_time_seconds": "1691415061"
     },
+    "total": 304.81222622700005,
     "count": 1,
+    "self": 0.46280846799999154,
     "children": {
         "run_training.setup": {
+            "total": 0.0594958140000017,
             "count": 1,
+            "self": 0.0594958140000017
         },
         "TrainerController.start_learning": {
+            "total": 304.28992194500006,
             "count": 1,
+            "self": 0.382598396000958,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.227173139999991,
                     "count": 1,
+                    "self": 3.227173139999991
                 },
                 "TrainerController.advance": {
+                    "total": 300.526569009999,
+                    "count": 8204,
+                    "self": 0.30370839101044567,
                     "children": {
                         "env_step": {
+                            "total": 74.41745272699035,
+                            "count": 8204,
+                            "self": 72.32699915599204,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 1.9106632459952948,
+                                    "count": 8204,
+                                    "self": 0.34805083399578507,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 1.5626124119995097,
+                                            "count": 1220,
+                                            "self": 1.5626124119995097
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.17979032500301173,
+                                    "count": 8203,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 303.55578765400156,
+                                            "count": 8203,
                                             "is_parallel": true,
+                                            "self": 249.32149769899894,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.0023363349999954153,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0005835759999968104,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0017527589999986048,
                                                                     "count": 2,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0017527589999986048
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.04357546699998238,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0008867889999919498,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.002490550000004532,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.002490550000004532
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.038356634999956896,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.038356634999956896
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0018414930000290042,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00047727599996960635,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0013642170000593978,
                                                                             "count": 2,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0013642170000593978
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 54.23428995500262,
+                                                    "count": 8202,
                                                     "is_parallel": true,
+                                                    "self": 2.723056837997717,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 3.282884594002894,
+                                                            "count": 8202,
                                                             "is_parallel": true,
+                                                            "self": 3.282884594002894
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 42.81378735900262,
+                                                            "count": 8202,
                                                             "is_parallel": true,
+                                                            "self": 42.81378735900262
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 5.4145611639993945,
+                                                            "count": 8202,
                                                             "is_parallel": true,
+                                                            "self": 2.0002190260005364,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 3.414342137998858,
+                                                                    "count": 16404,
                                                                     "is_parallel": true,
+                                                                    "self": 3.414342137998858
                                                                 }
                                                             }
                                                         }
                             }
                         },
                         "trainer_advance": {
+                            "total": 225.8054078919982,
+                            "count": 8203,
+                            "self": 0.4546590880020176,
                             "children": {
                                 "process_trajectory": {
+                                    "total": 29.880287868995254,
+                                    "count": 8203,
+                                    "self": 29.880287868995254
                                 },
                                 "_update_policy": {
+                                    "total": 195.47046093500092,
+                                    "count": 1083,
+                                    "self": 32.75555481800484,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
+                                            "total": 162.71490611699608,
+                                            "count": 35064,
+                                            "self": 162.71490611699608
                                         }
                                     }
                                 }
                     }
                 },
                 "trainer_threads": {
+                    "total": 1.627000074222451e-06,
                     "count": 1,
+                    "self": 1.627000074222451e-06
                 },
                 "TrainerController._save_models": {
+                    "total": 0.15357977200005735,
                     "count": 1,
+                    "self": 0.006318809000049441,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.1472609630000079,
                             "count": 1,
+                            "self": 0.1472609630000079
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -2,22 +2,22 @@
     "CubeChaseAgent": {
         "checkpoints": [
             {
-                "steps": 80967,
-                "file_path": "results/CubeChasev1.2/CubeChaseAgent/CubeChaseAgent-80967.onnx",
                 "reward": 1.0,
-                "creation_time": 1691412880.5270169,
                 "auxillary_file_paths": [
-                    "results/CubeChasev1.2/CubeChaseAgent/CubeChaseAgent-80967.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 80967,
-            "file_path": "results/CubeChasev1.2/CubeChaseAgent.onnx",
             "reward": 1.0,
-            "creation_time": 1691412880.5270169,
             "auxillary_file_paths": [
-                "results/CubeChasev1.2/CubeChaseAgent/CubeChaseAgent-80967.pt"
             ]
         }
     },

     "CubeChaseAgent": {
         "checkpoints": [
             {
+                "steps": 121672,
+                "file_path": "results/CubeChasev1.3/CubeChaseAgent/CubeChaseAgent-121672.onnx",
                 "reward": 1.0,
+                "creation_time": 1691415061.3471987,
                 "auxillary_file_paths": [
+                    "results/CubeChasev1.3/CubeChaseAgent/CubeChaseAgent-121672.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 121672,
+            "file_path": "results/CubeChasev1.3/CubeChaseAgent.onnx",
             "reward": 1.0,
+            "creation_time": 1691415061.3471987,
             "auxillary_file_paths": [
+                "results/CubeChasev1.3/CubeChaseAgent/CubeChaseAgent-121672.pt"
             ]
         }
     },