FredericProtat commited on
Commit
d98cc7f
·
1 Parent(s): 7909737
Huggy.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15dfb1a0eea5fdecb539043119bed4c9b793951ada569f059b4864af3a8cc0cc
3
- size 2271327
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce8c7f97dc43e15d15cd648601dd2e07bf7b40ab921e49c1908d66a43e291f91
3
+ size 17130437
Huggy/Huggy-1000048.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce8c7f97dc43e15d15cd648601dd2e07bf7b40ab921e49c1908d66a43e291f91
3
+ size 17130437
Huggy/Huggy-1000048.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fa7aebe474b4fba2dac6ed32a4e1748b968f13d635ebbf5c9fc888a67cc2d88
3
+ size 102538205
Huggy/Huggy-499998.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:243dd70101a42fe8ec2819cd73e112b1ab82c20273a9af515f098a4e2963fbed
3
+ size 17130437
Huggy/Huggy-499998.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7289682653a16e6ad66a826f56b72d58ac077f625fc096567c86bebb7947dfe6
3
+ size 102538205
Huggy/Huggy-999997.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5604cb29966e75b960c911fc9417194e37df089f044ffe43ab396d0e66f5c5fb
3
+ size 17130437
Huggy/Huggy-999997.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a269af3e15bab4d790f7a6565c026b8dec94fbfcbd28a88d6e2e9e99d24068db
3
+ size 102538205
Huggy/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc4292410326352e5b523c7db19be8a2ebdb33e4b62f408386e321fd30803fbe
3
- size 13503717
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fa7aebe474b4fba2dac6ed32a4e1748b968f13d635ebbf5c9fc888a67cc2d88
3
+ size 102538205
Huggy/events.out.tfevents.1690712863.d4b470349a0e.1571.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f827195b3d24c68f712100a7a87144f204dbece54f575817a7bbcf38140244b
3
+ size 156882
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 200000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "even_checkpoints": false, "max_steps": 2000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 1024, "num_layers": 5, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "even_checkpoints": false, "max_steps": 1000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -14,11 +14,11 @@ behaviors:
14
  learning_rate_schedule: linear
15
  beta_schedule: linear
16
  epsilon_schedule: linear
17
- checkpoint_interval: 200000
18
  network_settings:
19
  normalize: true
20
- hidden_units: 512
21
- num_layers: 3
22
  vis_encode_type: simple
23
  memory: null
24
  goal_conditioning_type: hyper
@@ -38,7 +38,7 @@ behaviors:
38
  init_path: null
39
  keep_checkpoints: 15
40
  even_checkpoints: false
41
- max_steps: 2000000
42
  time_horizon: 1000
43
  summary_freq: 50000
44
  threaded: false
 
14
  learning_rate_schedule: linear
15
  beta_schedule: linear
16
  epsilon_schedule: linear
17
+ checkpoint_interval: 500000
18
  network_settings:
19
  normalize: true
20
+ hidden_units: 1024
21
+ num_layers: 5
22
  vis_encode_type: simple
23
  memory: null
24
  goal_conditioning_type: hyper
 
38
  init_path: null
39
  keep_checkpoints: 15
40
  even_checkpoints: false
41
+ max_steps: 1000000
42
  time_horizon: 1000
43
  summary_freq: 50000
44
  threaded: false
run_logs/Player-0.log CHANGED
@@ -34,7 +34,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
34
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
35
  FMOD initialized on nosound output
36
  Begin MonoManager ReloadAssembly
37
- - Completed reload, in 0.122 seconds
38
  ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
40
  ERROR: Shader Hidden/Universal Render Pipeline/ScreenSpaceShadows shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -78,14 +78,14 @@ ERROR: Shader Universal Render Pipeline/Lit shader is not supported on this GPU
78
  WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
79
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
80
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
81
- UnloadTime: 0.800380 ms
82
  requesting resize 84 x 84
83
  Setting up 1 worker threads for Enlighten.
84
  Memory Statistics:
85
  [ALLOC_TEMP_TLS] TLS Allocator
86
  StackAllocators :
87
  [ALLOC_TEMP_MAIN]
88
- Peak usage frame count: [4.0 KB-8.0 KB]: 26761 frames, [2.0 MB-4.0 MB]: 1 frames
89
  Initial Block Size 4.0 MB
90
  Current Block Size 4.0 MB
91
  Peak Allocated Bytes 3.6 MB
@@ -93,7 +93,7 @@ Memory Statistics:
93
  [ALLOC_TEMP_Loading.AsyncRead]
94
  Initial Block Size 64.0 KB
95
  Current Block Size 64.0 KB
96
- Peak Allocated Bytes 240 B
97
  Overflow Count 0
98
  [ALLOC_TEMP_Loading.PreloadManager]
99
  Initial Block Size 256.0 KB
@@ -201,22 +201,22 @@ Memory Statistics:
201
  Peak Allocated Bytes 0 B
202
  Overflow Count 0
203
  [ALLOC_DEFAULT] Dual Thread Allocator
204
- Peak main deferred allocation count 269
205
  [ALLOC_BUCKET]
206
  Large Block size 4.0 MB
207
  Used Block count 1
208
  Peak Allocated bytes 1.4 MB
209
  [ALLOC_DEFAULT_MAIN]
210
- Peak usage frame count: [16.0 MB-32.0 MB]: 26762 frames
211
  Requested Block Size 16.0 MB
212
  Peak Block count 1
213
- Peak Allocated memory 23.5 MB
214
  Peak Large allocation bytes 16.0 MB
215
  [ALLOC_DEFAULT_THREAD]
216
- Peak usage frame count: [2.0 MB-4.0 MB]: 26762 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
- Peak Allocated memory 2.5 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_TEMP_JOB_1_FRAME]
222
  Initial Block Size 2.0 MB
@@ -245,13 +245,13 @@ Memory Statistics:
245
  Used Block count 1
246
  Peak Allocated bytes 1.4 MB
247
  [ALLOC_GFX_MAIN]
248
- Peak usage frame count: [32.0 KB-64.0 KB]: 26761 frames, [64.0 KB-128.0 KB]: 1 frames
249
  Requested Block Size 16.0 MB
250
  Peak Block count 1
251
  Peak Allocated memory 65.6 KB
252
  Peak Large allocation bytes 0 B
253
  [ALLOC_GFX_THREAD]
254
- Peak usage frame count: [64.0 KB-128.0 KB]: 26762 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 81.8 KB
@@ -263,13 +263,13 @@ Memory Statistics:
263
  Used Block count 1
264
  Peak Allocated bytes 1.4 MB
265
  [ALLOC_CACHEOBJECTS_MAIN]
266
- Peak usage frame count: [1.0 MB-2.0 MB]: 26761 frames, [16.0 MB-32.0 MB]: 1 frames
267
  Requested Block Size 4.0 MB
268
  Peak Block count 2
269
  Peak Allocated memory 30.6 MB
270
  Peak Large allocation bytes 24.9 MB
271
  [ALLOC_CACHEOBJECTS_THREAD]
272
- Peak usage frame count: [0.5 MB-1.0 MB]: 26761 frames, [2.0 MB-4.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 2.6 MB
@@ -281,13 +281,13 @@ Memory Statistics:
281
  Used Block count 1
282
  Peak Allocated bytes 1.4 MB
283
  [ALLOC_TYPETREE_MAIN]
284
- Peak usage frame count: [0-1.0 KB]: 26762 frames
285
  Requested Block Size 2.0 MB
286
  Peak Block count 1
287
  Peak Allocated memory 1.0 KB
288
  Peak Large allocation bytes 0 B
289
  [ALLOC_TYPETREE_THREAD]
290
- Peak usage frame count: [4.0 KB-8.0 KB]: 26762 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 7.3 KB
 
34
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
35
  FMOD initialized on nosound output
36
  Begin MonoManager ReloadAssembly
37
+ - Completed reload, in 0.087 seconds
38
  ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
40
  ERROR: Shader Hidden/Universal Render Pipeline/ScreenSpaceShadows shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
78
  WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
79
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
80
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
81
+ UnloadTime: 0.796061 ms
82
  requesting resize 84 x 84
83
  Setting up 1 worker threads for Enlighten.
84
  Memory Statistics:
85
  [ALLOC_TEMP_TLS] TLS Allocator
86
  StackAllocators :
87
  [ALLOC_TEMP_MAIN]
88
+ Peak usage frame count: [4.0 KB-8.0 KB]: 13381 frames, [2.0 MB-4.0 MB]: 1 frames
89
  Initial Block Size 4.0 MB
90
  Current Block Size 4.0 MB
91
  Peak Allocated Bytes 3.6 MB
 
93
  [ALLOC_TEMP_Loading.AsyncRead]
94
  Initial Block Size 64.0 KB
95
  Current Block Size 64.0 KB
96
+ Peak Allocated Bytes 184 B
97
  Overflow Count 0
98
  [ALLOC_TEMP_Loading.PreloadManager]
99
  Initial Block Size 256.0 KB
 
201
  Peak Allocated Bytes 0 B
202
  Overflow Count 0
203
  [ALLOC_DEFAULT] Dual Thread Allocator
204
+ Peak main deferred allocation count 250
205
  [ALLOC_BUCKET]
206
  Large Block size 4.0 MB
207
  Used Block count 1
208
  Peak Allocated bytes 1.4 MB
209
  [ALLOC_DEFAULT_MAIN]
210
+ Peak usage frame count: [16.0 MB-32.0 MB]: 13382 frames
211
  Requested Block Size 16.0 MB
212
  Peak Block count 1
213
+ Peak Allocated memory 22.3 MB
214
  Peak Large allocation bytes 16.0 MB
215
  [ALLOC_DEFAULT_THREAD]
216
+ Peak usage frame count: [2.0 MB-4.0 MB]: 13382 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
+ Peak Allocated memory 2.6 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_TEMP_JOB_1_FRAME]
222
  Initial Block Size 2.0 MB
 
245
  Used Block count 1
246
  Peak Allocated bytes 1.4 MB
247
  [ALLOC_GFX_MAIN]
248
+ Peak usage frame count: [32.0 KB-64.0 KB]: 13381 frames, [64.0 KB-128.0 KB]: 1 frames
249
  Requested Block Size 16.0 MB
250
  Peak Block count 1
251
  Peak Allocated memory 65.6 KB
252
  Peak Large allocation bytes 0 B
253
  [ALLOC_GFX_THREAD]
254
+ Peak usage frame count: [64.0 KB-128.0 KB]: 13382 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 81.8 KB
 
263
  Used Block count 1
264
  Peak Allocated bytes 1.4 MB
265
  [ALLOC_CACHEOBJECTS_MAIN]
266
+ Peak usage frame count: [1.0 MB-2.0 MB]: 13381 frames, [16.0 MB-32.0 MB]: 1 frames
267
  Requested Block Size 4.0 MB
268
  Peak Block count 2
269
  Peak Allocated memory 30.6 MB
270
  Peak Large allocation bytes 24.9 MB
271
  [ALLOC_CACHEOBJECTS_THREAD]
272
+ Peak usage frame count: [0.5 MB-1.0 MB]: 13381 frames, [2.0 MB-4.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 2.6 MB
 
281
  Used Block count 1
282
  Peak Allocated bytes 1.4 MB
283
  [ALLOC_TYPETREE_MAIN]
284
+ Peak usage frame count: [0-1.0 KB]: 13382 frames
285
  Requested Block Size 2.0 MB
286
  Peak Block count 1
287
  Peak Allocated memory 1.0 KB
288
  Peak Large allocation bytes 0 B
289
  [ALLOC_TYPETREE_THREAD]
290
+ Peak usage frame count: [4.0 KB-8.0 KB]: 13382 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 7.3 KB
run_logs/timers.json CHANGED
@@ -2,153 +2,153 @@
2
  "name": "root",
3
  "gauges": {
4
  "Huggy.Policy.Entropy.mean": {
5
- "value": 1.403953194618225,
6
- "min": 1.403953194618225,
7
- "max": 1.4273483753204346,
8
- "count": 40
9
  },
10
  "Huggy.Policy.Entropy.sum": {
11
- "value": 70023.5703125,
12
- "min": 68967.328125,
13
- "max": 78737.78125,
14
- "count": 40
15
  },
16
  "Huggy.Environment.EpisodeLength.mean": {
17
- "value": 82.39732888146912,
18
- "min": 74.20902255639098,
19
- "max": 379.54545454545456,
20
- "count": 40
21
  },
22
  "Huggy.Environment.EpisodeLength.sum": {
23
- "value": 49356.0,
24
- "min": 48783.0,
25
- "max": 50100.0,
26
- "count": 40
27
  },
28
  "Huggy.Step.mean": {
29
- "value": 1999998.0,
30
- "min": 49635.0,
31
- "max": 1999998.0,
32
- "count": 40
33
  },
34
  "Huggy.Step.sum": {
35
- "value": 1999998.0,
36
- "min": 49635.0,
37
- "max": 1999998.0,
38
- "count": 40
39
  },
40
  "Huggy.Policy.ExtrinsicValueEstimate.mean": {
41
- "value": 2.5261740684509277,
42
- "min": 0.1426374763250351,
43
- "max": 2.556769847869873,
44
- "count": 40
45
  },
46
  "Huggy.Policy.ExtrinsicValueEstimate.sum": {
47
- "value": 1513.17822265625,
48
- "min": 18.685508728027344,
49
- "max": 1649.146240234375,
50
- "count": 40
51
  },
52
  "Huggy.Environment.CumulativeReward.mean": {
53
- "value": 3.7853312678448545,
54
- "min": 1.7595527622535938,
55
- "max": 4.040156982260302,
56
- "count": 40
57
  },
58
  "Huggy.Environment.CumulativeReward.sum": {
59
- "value": 2267.413429439068,
60
- "min": 230.5014118552208,
61
- "max": 2602.952577829361,
62
- "count": 40
63
  },
64
  "Huggy.Policy.ExtrinsicReward.mean": {
65
- "value": 3.7853312678448545,
66
- "min": 1.7595527622535938,
67
- "max": 4.040156982260302,
68
- "count": 40
69
  },
70
  "Huggy.Policy.ExtrinsicReward.sum": {
71
- "value": 2267.413429439068,
72
- "min": 230.5014118552208,
73
- "max": 2602.952577829361,
74
- "count": 40
75
  },
76
  "Huggy.Losses.PolicyLoss.mean": {
77
- "value": 0.017877208416272574,
78
- "min": 0.014155605591561956,
79
- "max": 0.020184158803507067,
80
- "count": 40
81
  },
82
  "Huggy.Losses.PolicyLoss.sum": {
83
- "value": 0.053631625248817726,
84
- "min": 0.02831121118312391,
85
- "max": 0.0551270124381214,
86
- "count": 40
87
  },
88
  "Huggy.Losses.ValueLoss.mean": {
89
- "value": 0.05461679117547141,
90
- "min": 0.021587439626455304,
91
- "max": 0.06425863206386566,
92
- "count": 40
93
  },
94
  "Huggy.Losses.ValueLoss.sum": {
95
- "value": 0.16385037352641424,
96
- "min": 0.04317487925291061,
97
- "max": 0.17508697621524333,
98
- "count": 40
99
  },
100
  "Huggy.Policy.LearningRate.mean": {
101
- "value": 3.776248741283334e-06,
102
- "min": 3.776248741283334e-06,
103
- "max": 0.0002952900765699749,
104
- "count": 40
105
  },
106
  "Huggy.Policy.LearningRate.sum": {
107
- "value": 1.1328746223850001e-05,
108
- "min": 1.1328746223850001e-05,
109
- "max": 0.0008439145686951499,
110
- "count": 40
111
  },
112
  "Huggy.Policy.Epsilon.mean": {
113
- "value": 0.10125871666666668,
114
- "min": 0.10125871666666668,
115
- "max": 0.198430025,
116
- "count": 40
117
  },
118
  "Huggy.Policy.Epsilon.sum": {
119
- "value": 0.30377615,
120
- "min": 0.20767055,
121
- "max": 0.5813048500000001,
122
- "count": 40
123
  },
124
  "Huggy.Policy.Beta.mean": {
125
- "value": 7.280996166666668e-05,
126
- "min": 7.280996166666668e-05,
127
- "max": 0.0049216582475,
128
- "count": 40
129
  },
130
  "Huggy.Policy.Beta.sum": {
131
- "value": 0.00021842988500000006,
132
- "min": 0.00021842988500000006,
133
- "max": 0.014067112015000001,
134
- "count": 40
135
  },
136
  "Huggy.IsTraining.mean": {
137
  "value": 1.0,
138
  "min": 1.0,
139
  "max": 1.0,
140
- "count": 40
141
  },
142
  "Huggy.IsTraining.sum": {
143
  "value": 1.0,
144
  "min": 1.0,
145
  "max": 1.0,
146
- "count": 40
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
- "start_time_seconds": "1690583267",
152
  "python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
153
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics",
154
  "mlagents_version": "0.31.0.dev0",
@@ -156,59 +156,59 @@
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "1.11.0+cu102",
158
  "numpy_version": "1.21.2",
159
- "end_time_seconds": "1690585856"
160
  },
161
- "total": 2588.766835536,
162
  "count": 1,
163
- "self": 0.4954340930003127,
164
  "children": {
165
  "run_training.setup": {
166
- "total": 0.037516764000031344,
167
  "count": 1,
168
- "self": 0.037516764000031344
169
  },
170
  "TrainerController.start_learning": {
171
- "total": 2588.233884679,
172
  "count": 1,
173
- "self": 4.589962702969842,
174
  "children": {
175
  "TrainerController._reset_env": {
176
- "total": 5.886169492000022,
177
  "count": 1,
178
- "self": 5.886169492000022
179
  },
180
  "TrainerController.advance": {
181
- "total": 2577.6291935950303,
182
- "count": 233456,
183
- "self": 4.675258645137546,
184
  "children": {
185
  "env_step": {
186
- "total": 1982.4138683739782,
187
- "count": 233456,
188
- "self": 1680.5388024639528,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
- "total": 298.7917600520583,
192
- "count": 233456,
193
- "self": 17.207230754132752,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
- "total": 281.58452929792554,
197
- "count": 223014,
198
- "self": 281.58452929792554
199
  }
200
  }
201
  },
202
  "workers": {
203
- "total": 3.0833058579671615,
204
- "count": 233456,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
- "total": 2580.2034026209344,
209
- "count": 233456,
210
  "is_parallel": true,
211
- "self": 1206.656405075842,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
@@ -217,48 +217,48 @@
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
- "total": 0.001095160999966538,
221
  "count": 1,
222
  "is_parallel": true,
223
- "self": 0.00036009800004421777,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
- "total": 0.0007350629999223202,
227
  "count": 2,
228
  "is_parallel": true,
229
- "self": 0.0007350629999223202
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
- "total": 0.03181407299996408,
235
  "count": 1,
236
  "is_parallel": true,
237
- "self": 0.0003523400000062793,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
- "total": 0.0002952959999902305,
241
  "count": 1,
242
  "is_parallel": true,
243
- "self": 0.0002952959999902305
244
  },
245
  "communicator.exchange": {
246
- "total": 0.030361092000021017,
247
  "count": 1,
248
  "is_parallel": true,
249
- "self": 0.030361092000021017
250
  },
251
  "steps_from_proto": {
252
- "total": 0.0008053449999465556,
253
  "count": 1,
254
  "is_parallel": true,
255
- "self": 0.00023592399998051405,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
- "total": 0.0005694209999660416,
259
  "count": 2,
260
  "is_parallel": true,
261
- "self": 0.0005694209999660416
262
  }
263
  }
264
  }
@@ -267,34 +267,34 @@
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
- "total": 1373.5469975450924,
271
- "count": 233455,
272
  "is_parallel": true,
273
- "self": 42.58592508306447,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
- "total": 85.86942661596044,
277
- "count": 233455,
278
  "is_parallel": true,
279
- "self": 85.86942661596044
280
  },
281
  "communicator.exchange": {
282
- "total": 1142.4717541311088,
283
- "count": 233455,
284
  "is_parallel": true,
285
- "self": 1142.4717541311088
286
  },
287
  "steps_from_proto": {
288
- "total": 102.6198917149585,
289
- "count": 233455,
290
  "is_parallel": true,
291
- "self": 37.3222376349658,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
- "total": 65.2976540799927,
295
- "count": 466910,
296
  "is_parallel": true,
297
- "self": 65.2976540799927
298
  }
299
  }
300
  }
@@ -307,31 +307,31 @@
307
  }
308
  },
309
  "trainer_advance": {
310
- "total": 590.5400665759146,
311
- "count": 233456,
312
- "self": 7.027893117021904,
313
  "children": {
314
  "process_trajectory": {
315
- "total": 148.17114591989144,
316
- "count": 233456,
317
- "self": 146.77920900089117,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
- "total": 1.3919369190002726,
321
- "count": 10,
322
- "self": 1.3919369190002726
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
- "total": 435.3410275390013,
328
- "count": 97,
329
- "self": 373.34987713301365,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
- "total": 61.99115040598764,
333
- "count": 2910,
334
- "self": 61.99115040598764
335
  }
336
  }
337
  }
@@ -340,19 +340,19 @@
340
  }
341
  },
342
  "trainer_threads": {
343
- "total": 9.7599968285067e-07,
344
  "count": 1,
345
- "self": 9.7599968285067e-07
346
  },
347
  "TrainerController._save_models": {
348
- "total": 0.12855791299989505,
349
  "count": 1,
350
- "self": 0.002049004000127752,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
- "total": 0.1265089089997673,
354
  "count": 1,
355
- "self": 0.1265089089997673
356
  }
357
  }
358
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "Huggy.Policy.Entropy.mean": {
5
+ "value": 1.4014936685562134,
6
+ "min": 1.4014936685562134,
7
+ "max": 1.4209308624267578,
8
+ "count": 20
9
  },
10
  "Huggy.Policy.Entropy.sum": {
11
+ "value": 69209.9609375,
12
+ "min": 68469.4375,
13
+ "max": 78726.71875,
14
+ "count": 20
15
  },
16
  "Huggy.Environment.EpisodeLength.mean": {
17
+ "value": 92.65543071161049,
18
+ "min": 92.16387337057728,
19
+ "max": 423.6386554621849,
20
+ "count": 20
21
  },
22
  "Huggy.Environment.EpisodeLength.sum": {
23
+ "value": 49478.0,
24
+ "min": 49166.0,
25
+ "max": 50413.0,
26
+ "count": 20
27
  },
28
  "Huggy.Step.mean": {
29
+ "value": 999997.0,
30
+ "min": 49936.0,
31
+ "max": 999997.0,
32
+ "count": 20
33
  },
34
  "Huggy.Step.sum": {
35
+ "value": 999997.0,
36
+ "min": 49936.0,
37
+ "max": 999997.0,
38
+ "count": 20
39
  },
40
  "Huggy.Policy.ExtrinsicValueEstimate.mean": {
41
+ "value": 2.316720485687256,
42
+ "min": 0.10337124019861221,
43
+ "max": 2.3928511142730713,
44
+ "count": 20
45
  },
46
  "Huggy.Policy.ExtrinsicValueEstimate.sum": {
47
+ "value": 1237.1287841796875,
48
+ "min": 12.197806358337402,
49
+ "max": 1237.1287841796875,
50
+ "count": 20
51
  },
52
  "Huggy.Environment.CumulativeReward.mean": {
53
+ "value": 3.696406583995855,
54
+ "min": 1.9392764144024606,
55
+ "max": 4.019030564286735,
56
+ "count": 20
57
  },
58
  "Huggy.Environment.CumulativeReward.sum": {
59
+ "value": 1973.8811158537865,
60
+ "min": 228.83461689949036,
61
+ "max": 2034.4308470487595,
62
+ "count": 20
63
  },
64
  "Huggy.Policy.ExtrinsicReward.mean": {
65
+ "value": 3.696406583995855,
66
+ "min": 1.9392764144024606,
67
+ "max": 4.019030564286735,
68
+ "count": 20
69
  },
70
  "Huggy.Policy.ExtrinsicReward.sum": {
71
+ "value": 1973.8811158537865,
72
+ "min": 228.83461689949036,
73
+ "max": 2034.4308470487595,
74
+ "count": 20
75
  },
76
  "Huggy.Losses.PolicyLoss.mean": {
77
+ "value": 0.019508854223143617,
78
+ "min": 0.013560492175020044,
79
+ "max": 0.019508854223143617,
80
+ "count": 20
81
  },
82
  "Huggy.Losses.PolicyLoss.sum": {
83
+ "value": 0.058526562669430855,
84
+ "min": 0.027120984350040088,
85
+ "max": 0.058526562669430855,
86
+ "count": 20
87
  },
88
  "Huggy.Losses.ValueLoss.mean": {
89
+ "value": 0.05377725619408819,
90
+ "min": 0.021555157378315926,
91
+ "max": 0.05377725619408819,
92
+ "count": 20
93
  },
94
  "Huggy.Losses.ValueLoss.sum": {
95
+ "value": 0.16133176858226458,
96
+ "min": 0.04311031475663185,
97
+ "max": 0.16133176858226458,
98
+ "count": 20
99
  },
100
  "Huggy.Policy.LearningRate.mean": {
101
+ "value": 8.697097100999997e-06,
102
+ "min": 8.697097100999997e-06,
103
+ "max": 0.00029056095314634997,
104
+ "count": 20
105
  },
106
  "Huggy.Policy.LearningRate.sum": {
107
+ "value": 2.6091291302999993e-05,
108
+ "min": 2.6091291302999993e-05,
109
+ "max": 0.0007875732374755999,
110
+ "count": 20
111
  },
112
  "Huggy.Policy.Epsilon.mean": {
113
+ "value": 0.10289900000000003,
114
+ "min": 0.10289900000000003,
115
+ "max": 0.19685365,
116
+ "count": 20
117
  },
118
  "Huggy.Policy.Epsilon.sum": {
119
+ "value": 0.3086970000000001,
120
+ "min": 0.21608970000000008,
121
+ "max": 0.5625244,
122
+ "count": 20
123
  },
124
  "Huggy.Policy.Beta.mean": {
125
+ "value": 0.0001546601,
126
+ "min": 0.0001546601,
127
+ "max": 0.004842997135,
128
+ "count": 20
129
  },
130
  "Huggy.Policy.Beta.sum": {
131
+ "value": 0.0004639803,
132
+ "min": 0.0004639803,
133
+ "max": 0.013129967559999997,
134
+ "count": 20
135
  },
136
  "Huggy.IsTraining.mean": {
137
  "value": 1.0,
138
  "min": 1.0,
139
  "max": 1.0,
140
+ "count": 20
141
  },
142
  "Huggy.IsTraining.sum": {
143
  "value": 1.0,
144
  "min": 1.0,
145
  "max": 1.0,
146
+ "count": 20
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
+ "start_time_seconds": "1690712861",
152
  "python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
153
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics",
154
  "mlagents_version": "0.31.0.dev0",
 
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "1.11.0+cu102",
158
  "numpy_version": "1.21.2",
159
+ "end_time_seconds": "1690714270"
160
  },
161
+ "total": 1409.180272759,
162
  "count": 1,
163
+ "self": 0.8060954229997606,
164
  "children": {
165
  "run_training.setup": {
166
+ "total": 0.03422981699998218,
167
  "count": 1,
168
+ "self": 0.03422981699998218
169
  },
170
  "TrainerController.start_learning": {
171
+ "total": 1408.3399475190001,
172
  "count": 1,
173
+ "self": 2.5385607980008444,
174
  "children": {
175
  "TrainerController._reset_env": {
176
+ "total": 5.25036774299997,
177
  "count": 1,
178
+ "self": 5.25036774299997
179
  },
180
  "TrainerController.advance": {
181
+ "total": 1399.6844948989992,
182
+ "count": 115315,
183
+ "self": 2.603209687017852,
184
  "children": {
185
  "env_step": {
186
+ "total": 1064.3650384289958,
187
+ "count": 115315,
188
+ "self": 888.7020123719685,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
+ "total": 174.00334019204223,
192
+ "count": 115315,
193
+ "self": 9.162774786042974,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
+ "total": 164.84056540599926,
197
+ "count": 111517,
198
+ "self": 164.84056540599926
199
  }
200
  }
201
  },
202
  "workers": {
203
+ "total": 1.6596858649851356,
204
+ "count": 115315,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
+ "total": 1402.507522992987,
209
+ "count": 115315,
210
  "is_parallel": true,
211
+ "self": 677.7311896820065,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
 
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
+ "total": 0.0009422530000051665,
221
  "count": 1,
222
  "is_parallel": true,
223
+ "self": 0.00028129599996873367,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
+ "total": 0.0006609570000364329,
227
  "count": 2,
228
  "is_parallel": true,
229
+ "self": 0.0006609570000364329
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
+ "total": 0.06981709199999386,
235
  "count": 1,
236
  "is_parallel": true,
237
+ "self": 0.0004136790000188739,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
+ "total": 0.00025681500000018787,
241
  "count": 1,
242
  "is_parallel": true,
243
+ "self": 0.00025681500000018787
244
  },
245
  "communicator.exchange": {
246
+ "total": 0.06833572199997207,
247
  "count": 1,
248
  "is_parallel": true,
249
+ "self": 0.06833572199997207
250
  },
251
  "steps_from_proto": {
252
+ "total": 0.000810876000002736,
253
  "count": 1,
254
  "is_parallel": true,
255
+ "self": 0.00026542299997345253,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
+ "total": 0.0005454530000292834,
259
  "count": 2,
260
  "is_parallel": true,
261
+ "self": 0.0005454530000292834
262
  }
263
  }
264
  }
 
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
+ "total": 724.7763333109806,
271
+ "count": 115314,
272
  "is_parallel": true,
273
+ "self": 21.94055533093342,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
+ "total": 46.35788364499206,
277
+ "count": 115314,
278
  "is_parallel": true,
279
+ "self": 46.35788364499206
280
  },
281
  "communicator.exchange": {
282
+ "total": 603.4598228040127,
283
+ "count": 115314,
284
  "is_parallel": true,
285
+ "self": 603.4598228040127
286
  },
287
  "steps_from_proto": {
288
+ "total": 53.01807153104238,
289
+ "count": 115314,
290
  "is_parallel": true,
291
+ "self": 20.454085545991347,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
+ "total": 32.56398598505103,
295
+ "count": 230628,
296
  "is_parallel": true,
297
+ "self": 32.56398598505103
298
  }
299
  }
300
  }
 
307
  }
308
  },
309
  "trainer_advance": {
310
+ "total": 332.7162467829855,
311
+ "count": 115315,
312
+ "self": 3.6129976739747462,
313
  "children": {
314
  "process_trajectory": {
315
+ "total": 75.81877049801085,
316
+ "count": 115315,
317
+ "self": 74.37130274901085,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
+ "total": 1.4474677489999976,
321
+ "count": 2,
322
+ "self": 1.4474677489999976
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
+ "total": 253.28447861099988,
328
+ "count": 48,
329
+ "self": 185.84675691799885,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
+ "total": 67.43772169300104,
333
+ "count": 1440,
334
+ "self": 67.43772169300104
335
  }
336
  }
337
  }
 
340
  }
341
  },
342
  "trainer_threads": {
343
+ "total": 1.4690001535200281e-06,
344
  "count": 1,
345
+ "self": 1.4690001535200281e-06
346
  },
347
  "TrainerController._save_models": {
348
+ "total": 0.8665226099999472,
349
  "count": 1,
350
+ "self": 0.020756390999849827,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
+ "total": 0.8457662190000974,
354
  "count": 1,
355
+ "self": 0.8457662190000974
356
  }
357
  }
358
  }
run_logs/training_status.json CHANGED
@@ -2,112 +2,40 @@
2
  "Huggy": {
3
  "checkpoints": [
4
  {
5
- "steps": 199614,
6
- "file_path": "results/Huggy/Huggy/Huggy-199614.onnx",
7
- "reward": 3.4442040760125687,
8
- "creation_time": 1690583517.927822,
9
  "auxillary_file_paths": [
10
- "results/Huggy/Huggy/Huggy-199614.pt"
11
  ]
12
  },
13
  {
14
- "steps": 399852,
15
- "file_path": "results/Huggy/Huggy/Huggy-399852.onnx",
16
- "reward": 4.124925029479851,
17
- "creation_time": 1690583779.96298,
18
  "auxillary_file_paths": [
19
- "results/Huggy/Huggy/Huggy-399852.pt"
20
  ]
21
  },
22
  {
23
- "steps": 599966,
24
- "file_path": "results/Huggy/Huggy/Huggy-599966.onnx",
25
- "reward": 3.802982736717571,
26
- "creation_time": 1690584026.791236,
27
  "auxillary_file_paths": [
28
- "results/Huggy/Huggy/Huggy-599966.pt"
29
- ]
30
- },
31
- {
32
- "steps": 799966,
33
- "file_path": "results/Huggy/Huggy/Huggy-799966.onnx",
34
- "reward": 3.8715678082271054,
35
- "creation_time": 1690584274.5079417,
36
- "auxillary_file_paths": [
37
- "results/Huggy/Huggy/Huggy-799966.pt"
38
- ]
39
- },
40
- {
41
- "steps": 999981,
42
- "file_path": "results/Huggy/Huggy/Huggy-999981.onnx",
43
- "reward": 3.677767977204626,
44
- "creation_time": 1690584525.3432307,
45
- "auxillary_file_paths": [
46
- "results/Huggy/Huggy/Huggy-999981.pt"
47
- ]
48
- },
49
- {
50
- "steps": 1199405,
51
- "file_path": "results/Huggy/Huggy/Huggy-1199405.onnx",
52
- "reward": 3.9628135824716217,
53
- "creation_time": 1690584776.3798282,
54
- "auxillary_file_paths": [
55
- "results/Huggy/Huggy/Huggy-1199405.pt"
56
- ]
57
- },
58
- {
59
- "steps": 1399960,
60
- "file_path": "results/Huggy/Huggy/Huggy-1399960.onnx",
61
- "reward": 3.474997438233474,
62
- "creation_time": 1690585040.608361,
63
- "auxillary_file_paths": [
64
- "results/Huggy/Huggy/Huggy-1399960.pt"
65
- ]
66
- },
67
- {
68
- "steps": 1599957,
69
- "file_path": "results/Huggy/Huggy/Huggy-1599957.onnx",
70
- "reward": 3.6568161831345667,
71
- "creation_time": 1690585309.406654,
72
- "auxillary_file_paths": [
73
- "results/Huggy/Huggy/Huggy-1599957.pt"
74
- ]
75
- },
76
- {
77
- "steps": 1799916,
78
- "file_path": "results/Huggy/Huggy/Huggy-1799916.onnx",
79
- "reward": 3.668588197638846,
80
- "creation_time": 1690585582.6251736,
81
- "auxillary_file_paths": [
82
- "results/Huggy/Huggy/Huggy-1799916.pt"
83
- ]
84
- },
85
- {
86
- "steps": 1999998,
87
- "file_path": "results/Huggy/Huggy/Huggy-1999998.onnx",
88
- "reward": 3.6643659095374908,
89
- "creation_time": 1690585855.813841,
90
- "auxillary_file_paths": [
91
- "results/Huggy/Huggy/Huggy-1999998.pt"
92
- ]
93
- },
94
- {
95
- "steps": 2000045,
96
- "file_path": "results/Huggy/Huggy/Huggy-2000045.onnx",
97
- "reward": 3.6713722276687624,
98
- "creation_time": 1690585855.9445167,
99
- "auxillary_file_paths": [
100
- "results/Huggy/Huggy/Huggy-2000045.pt"
101
  ]
102
  }
103
  ],
104
  "final_checkpoint": {
105
- "steps": 2000045,
106
  "file_path": "results/Huggy/Huggy.onnx",
107
- "reward": 3.6713722276687624,
108
- "creation_time": 1690585855.9445167,
109
  "auxillary_file_paths": [
110
- "results/Huggy/Huggy/Huggy-2000045.pt"
111
  ]
112
  }
113
  },
 
2
  "Huggy": {
3
  "checkpoints": [
4
  {
5
+ "steps": 499998,
6
+ "file_path": "results/Huggy/Huggy/Huggy-499998.onnx",
7
+ "reward": 4.570572445025811,
8
+ "creation_time": 1690713559.0714483,
9
  "auxillary_file_paths": [
10
+ "results/Huggy/Huggy/Huggy-499998.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 999997,
15
+ "file_path": "results/Huggy/Huggy/Huggy-999997.onnx",
16
+ "reward": 3.6014482759414834,
17
+ "creation_time": 1690714268.6120915,
18
  "auxillary_file_paths": [
19
+ "results/Huggy/Huggy/Huggy-999997.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 1000048,
24
+ "file_path": "results/Huggy/Huggy/Huggy-1000048.onnx",
25
+ "reward": 3.589829779926099,
26
+ "creation_time": 1690714269.464684,
27
  "auxillary_file_paths": [
28
+ "results/Huggy/Huggy/Huggy-1000048.pt"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  ]
30
  }
31
  ],
32
  "final_checkpoint": {
33
+ "steps": 1000048,
34
  "file_path": "results/Huggy/Huggy.onnx",
35
+ "reward": 3.589829779926099,
36
+ "creation_time": 1690714269.464684,
37
  "auxillary_file_paths": [
38
+ "results/Huggy/Huggy/Huggy-1000048.pt"
39
  ]
40
  }
41
  },