Caesarrr commited on
Commit
ba3f5c4
·
verified ·
1 Parent(s): 998eea8

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -48,3 +48,4 @@ factor_sweeps/flappy/observation_stride/train/factor_sweep:flappy:observation_st
48
  factor_sweeps/flappy/observation_stride/train/factor_sweep:flappy:observation_stride:fixed_l2:fs4:obs15:stride2:seed12/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
49
  factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed10/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
50
  factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed11/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
 
 
48
  factor_sweeps/flappy/observation_stride/train/factor_sweep:flappy:observation_stride:fixed_l2:fs4:obs15:stride2:seed12/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
49
  factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed10/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
50
  factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed11/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
51
+ factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/episode_metrics.jsonl filter=lfs diff=lfs merge=lfs -text
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/checkpoint_p0/best_000048840_25034752_reward_2156.198.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:881450007cfa014c9d46bbf821d36d207882ccbc3953672f02e06298a21abe2a
3
+ size 22210361
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/checkpoint_p0/checkpoint_000021152_10846208.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1401620a4db490f3e59bb22706fd389deb0273a8e6ea08d7e14cdf932072aba
3
+ size 22210721
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/checkpoint_p0/checkpoint_000042720_21889024.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f62bc7349347379d1899dafd39c31f488b9037411282d6f3a0d23b54890f297
3
+ size 22210721
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/checkpoint_p0/checkpoint_000048840_25034752.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e80d5d6d07bced0410b185491cb4288b7fd087a616e3372f6beca2a24e0a8e6
3
+ size 22210721
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/config.json ADDED
@@ -0,0 +1,266 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "help": false,
3
+ "algo": "APPO",
4
+ "env": "latency_flappy",
5
+ "experiment": "flappy_frame_stack_fixed_l2_fs5_seed12",
6
+ "train_dir": "results/checkpoints_factor_sweeps/flappy/context_window",
7
+ "restart_behavior": "resume",
8
+ "device": "gpu",
9
+ "seed": 12,
10
+ "num_policies": 1,
11
+ "async_rl": true,
12
+ "serial_mode": false,
13
+ "batched_sampling": true,
14
+ "num_batches_to_accumulate": 2,
15
+ "worker_num_splits": 1,
16
+ "policy_workers_per_policy": 1,
17
+ "max_policy_lag": 400,
18
+ "num_workers": 2,
19
+ "num_envs_per_worker": 1,
20
+ "batch_size": 4096,
21
+ "num_batches_per_epoch": 8,
22
+ "num_epochs": 8,
23
+ "rollout": 128,
24
+ "recurrence": 1,
25
+ "shuffle_minibatches": false,
26
+ "gamma": 0.99,
27
+ "reward_scale": 1.0,
28
+ "reward_clip": 1000.0,
29
+ "value_bootstrap": false,
30
+ "normalize_returns": true,
31
+ "exploration_loss_coeff": 0.003,
32
+ "value_loss_coeff": 0.5,
33
+ "kl_loss_coeff": 0.0,
34
+ "exploration_loss": "entropy",
35
+ "gae_lambda": 0.95,
36
+ "ppo_clip_ratio": 0.1,
37
+ "ppo_clip_value": 0.2,
38
+ "with_vtrace": false,
39
+ "vtrace_rho": 1.0,
40
+ "vtrace_c": 1.0,
41
+ "optimizer": "adam",
42
+ "adam_eps": 1e-05,
43
+ "adam_beta1": 0.9,
44
+ "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.5,
46
+ "learning_rate": 0.00025,
47
+ "lr_schedule": "linear_decay",
48
+ "lr_schedule_kl_threshold": 0.008,
49
+ "lr_adaptive_min": 1e-06,
50
+ "lr_adaptive_max": 0.01,
51
+ "obs_subtract_mean": 0.0,
52
+ "obs_scale": 255.0,
53
+ "normalize_input": true,
54
+ "normalize_input_keys": null,
55
+ "decorrelate_experience_max_seconds": 0,
56
+ "decorrelate_envs_on_one_worker": true,
57
+ "actor_worker_gpus": [
58
+ 0
59
+ ],
60
+ "set_workers_cpu_affinity": true,
61
+ "force_envs_single_thread": false,
62
+ "default_niceness": 0,
63
+ "log_to_file": true,
64
+ "experiment_summaries_interval": 1,
65
+ "flush_summaries_interval": 30,
66
+ "stats_avg": 100,
67
+ "summaries_use_frameskip": true,
68
+ "heartbeat_interval": 20,
69
+ "heartbeat_reporting_interval": 180,
70
+ "train_for_env_steps": 25000000,
71
+ "train_for_seconds": 10000000000,
72
+ "save_every_sec": 600,
73
+ "keep_checkpoints": 5,
74
+ "load_checkpoint_kind": "latest",
75
+ "save_milestones_sec": -1,
76
+ "save_best_every_sec": 5,
77
+ "save_best_metric": "reward",
78
+ "save_best_after": 100000,
79
+ "benchmark": false,
80
+ "encoder_mlp_layers": [
81
+ 512,
82
+ 512
83
+ ],
84
+ "encoder_conv_architecture": "convnet_atari",
85
+ "encoder_conv_mlp_layers": [
86
+ 512
87
+ ],
88
+ "use_rnn": false,
89
+ "rnn_size": 512,
90
+ "rnn_type": "gru",
91
+ "rnn_num_layers": 1,
92
+ "decoder_mlp_layers": [],
93
+ "nonlinearity": "elu",
94
+ "policy_initialization": "orthogonal",
95
+ "policy_init_gain": 1.0,
96
+ "actor_critic_share_weights": true,
97
+ "adaptive_stddev": true,
98
+ "continuous_tanh_scale": 0.0,
99
+ "initial_stddev": 1.0,
100
+ "use_env_info_cache": false,
101
+ "env_gpu_actions": true,
102
+ "env_gpu_observations": true,
103
+ "env_frameskip": 1,
104
+ "env_framestack": 1,
105
+ "pixel_format": "CHW",
106
+ "use_record_episode_statistics": false,
107
+ "with_wandb": true,
108
+ "wandb_user": null,
109
+ "wandb_project": "latency-sensitive-bench",
110
+ "wandb_group": "flappy-fs5-fixed_l2",
111
+ "wandb_job_type": "sample_factory",
112
+ "wandb_tags": [
113
+ "factor_sweep",
114
+ "flappy",
115
+ "frame_stack",
116
+ "fixed",
117
+ "fixed_l2",
118
+ "fs5",
119
+ "seed12"
120
+ ],
121
+ "with_pbt": false,
122
+ "pbt_mix_policies_in_one_env": true,
123
+ "pbt_period_env_steps": 5000000,
124
+ "pbt_start_mutation": 20000000,
125
+ "pbt_replace_fraction": 0.3,
126
+ "pbt_mutation_rate": 0.15,
127
+ "pbt_replace_reward_gap": 0.1,
128
+ "pbt_replace_reward_gap_absolute": 1e-06,
129
+ "pbt_optimize_gamma": false,
130
+ "pbt_target_objective": "true_objective",
131
+ "pbt_perturb_min": 1.1,
132
+ "pbt_perturb_max": 1.5,
133
+ "gym_id": "FlappyBird-v0",
134
+ "env_fps": 30.0,
135
+ "obs_fps": 30.0,
136
+ "use_lidar": false,
137
+ "normalize_obs": true,
138
+ "audio_on": false,
139
+ "screen_size": "",
140
+ "obs_resize": "84,84",
141
+ "use_gpu_render": true,
142
+ "simulator": "gpu",
143
+ "gpu_render_device": "auto",
144
+ "gpu_render_batch_size": 128,
145
+ "gpu_render_profile": false,
146
+ "gpu_render_profile_interval": 200,
147
+ "pipe_gap": 100,
148
+ "bird_color": "yellow",
149
+ "pipe_color": "green",
150
+ "background": "day",
151
+ "score_limit": -1,
152
+ "frame_stack": 5,
153
+ "debug": false,
154
+ "debug_timelimit_diagnostics": false,
155
+ "max_episode_steps": 0,
156
+ "mode": "train",
157
+ "latency_type": "fixed",
158
+ "fixed_latency_ms": 66.66666666666667,
159
+ "mean_latency_ms": null,
160
+ "std_latency_ms": null,
161
+ "min_latency_ms": null,
162
+ "max_latency_ms": null,
163
+ "latency_seed": null,
164
+ "add_latency_info": false,
165
+ "max_pending_actions": null,
166
+ "hold_policy": "one_frame_then_noop",
167
+ "ordering_policy": "latest_ready",
168
+ "eval_episodes": 100,
169
+ "eval_parallel_envs": 100,
170
+ "eval_latency_raw_frame_values": "0,1,2,3,4,5",
171
+ "eval_max_steps": 3600,
172
+ "eval_deterministic": true,
173
+ "eval_raw_reward": false,
174
+ "episode_metrics_path": "results/checkpoints_factor_sweeps/flappy/context_window/flappy_frame_stack_fixed_l2_fs5_seed12/episode_metrics.jsonl",
175
+ "command_line": "--mode train --algo APPO --env latency_flappy --experiment flappy_frame_stack_fixed_l2_fs5_seed12 --train_dir results/checkpoints_factor_sweeps/flappy/context_window --restart_behavior resume --device gpu --actor_worker_gpus 0 --env_gpu_observations True --env_gpu_actions True --gpu-render-batch-size 128 --seed 12 --episode_metrics_path results/checkpoints_factor_sweeps/flappy/context_window/flappy_frame_stack_fixed_l2_fs5_seed12/episode_metrics.jsonl --train_for_env_steps 25000000 --num_workers 2 --num_envs_per_worker 1 --num_policies 1 --batch_size 4096 --rollout 128 --recurrence 1 --num_epochs 8 --num_batches_per_epoch 8 --worker_num_splits 1 --max_policy_lag 400 --learning_rate 0.00025 --gamma 0.99 --gae_lambda 0.95 --ppo_clip_ratio 0.1 --ppo_clip_value 0.2 --value_loss_coeff 0.5 --max_grad_norm 0.5 --save_every_sec 600 --keep_checkpoints 5 --stats_avg 100 --experiment_summaries_interval 1 --batched_sampling True --async_rl True --use_rnn False --normalize_returns True --normalize_input True --latency-type fixed --fixed-latency-ms 66.66666666666667 --add-latency-info False --eval-episodes 100 --eval-parallel-envs 100 --eval-max-steps 3600 --eval-deterministic True --with_wandb True --wandb_project latency-sensitive-bench --wandb_group flappy-fs5-fixed_l2 --wandb_job_type sample_factory --wandb_tags factor_sweep flappy frame_stack fixed fixed_l2 fs5 seed12 --gym_id FlappyBird-v0 --env-fps 30 --obs-fps 30.0 --use_lidar False --normalize_obs True --audio_on False --obs_resize 84,84 --use-gpu-render True --simulator gpu --gpu-render-device auto --gpu-render-profile False --gpu-render-profile-interval 200 --pipe_gap 100 --bird_color yellow --pipe_color green --background day --frame_stack 5 --debug False --debug-timelimit-diagnostics False --hold-policy one_frame_then_noop --ordering-policy latest_ready",
176
+ "cli_args": {
177
+ "algo": "APPO",
178
+ "env": "latency_flappy",
179
+ "experiment": "flappy_frame_stack_fixed_l2_fs5_seed12",
180
+ "train_dir": "results/checkpoints_factor_sweeps/flappy/context_window",
181
+ "restart_behavior": "resume",
182
+ "device": "gpu",
183
+ "seed": 12,
184
+ "num_policies": 1,
185
+ "async_rl": true,
186
+ "batched_sampling": true,
187
+ "worker_num_splits": 1,
188
+ "max_policy_lag": 400,
189
+ "num_workers": 2,
190
+ "num_envs_per_worker": 1,
191
+ "batch_size": 4096,
192
+ "num_batches_per_epoch": 8,
193
+ "num_epochs": 8,
194
+ "rollout": 128,
195
+ "recurrence": 1,
196
+ "gamma": 0.99,
197
+ "normalize_returns": true,
198
+ "value_loss_coeff": 0.5,
199
+ "gae_lambda": 0.95,
200
+ "ppo_clip_ratio": 0.1,
201
+ "ppo_clip_value": 0.2,
202
+ "max_grad_norm": 0.5,
203
+ "learning_rate": 0.00025,
204
+ "normalize_input": true,
205
+ "actor_worker_gpus": [
206
+ 0
207
+ ],
208
+ "experiment_summaries_interval": 1,
209
+ "stats_avg": 100,
210
+ "train_for_env_steps": 25000000,
211
+ "save_every_sec": 600,
212
+ "keep_checkpoints": 5,
213
+ "use_rnn": false,
214
+ "env_gpu_actions": true,
215
+ "env_gpu_observations": true,
216
+ "with_wandb": true,
217
+ "wandb_project": "latency-sensitive-bench",
218
+ "wandb_group": "flappy-fs5-fixed_l2",
219
+ "wandb_job_type": "sample_factory",
220
+ "wandb_tags": [
221
+ "factor_sweep",
222
+ "flappy",
223
+ "frame_stack",
224
+ "fixed",
225
+ "fixed_l2",
226
+ "fs5",
227
+ "seed12"
228
+ ],
229
+ "gym_id": "FlappyBird-v0",
230
+ "env_fps": 30.0,
231
+ "obs_fps": 30.0,
232
+ "use_lidar": false,
233
+ "normalize_obs": true,
234
+ "audio_on": false,
235
+ "obs_resize": "84,84",
236
+ "use_gpu_render": true,
237
+ "simulator": "gpu",
238
+ "gpu_render_device": "auto",
239
+ "gpu_render_batch_size": 128,
240
+ "gpu_render_profile": false,
241
+ "gpu_render_profile_interval": 200,
242
+ "pipe_gap": 100,
243
+ "bird_color": "yellow",
244
+ "pipe_color": "green",
245
+ "background": "day",
246
+ "frame_stack": 5,
247
+ "debug": false,
248
+ "debug_timelimit_diagnostics": false,
249
+ "mode": "train",
250
+ "latency_type": "fixed",
251
+ "fixed_latency_ms": 66.66666666666667,
252
+ "add_latency_info": false,
253
+ "hold_policy": "one_frame_then_noop",
254
+ "ordering_policy": "latest_ready",
255
+ "eval_episodes": 100,
256
+ "eval_parallel_envs": 100,
257
+ "eval_max_steps": 3600,
258
+ "eval_deterministic": true,
259
+ "episode_metrics_path": "results/checkpoints_factor_sweeps/flappy/context_window/flappy_frame_stack_fixed_l2_fs5_seed12/episode_metrics.jsonl"
260
+ },
261
+ "git_hash": "284fe8ace24f0e8a40c03c5b559969abd7caeb29",
262
+ "git_repo_name": "git@github.com:ZihanWang314/latency-sensitive-bench.git",
263
+ "eval_env_frameskip": 1,
264
+ "output_dir": "outputs/factor_sweeps/flappy/context_window/train/frame_stack/fixed_l2/fs5/seed_12",
265
+ "wandb_unique_id": "flappy-fs5-fixed_l2-s12"
266
+ }
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/episode_metrics.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56af456ed3e58ad4937015279dbdba3f55d22410fafdc5225a0018df74f34a5
3
+ size 20384405
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/git.diff ADDED
File without changes
factor_sweeps/flappy/context_window/train/factor_sweep:flappy:frame_stack:fixed_l2:fs5:obs30:stride1:seed12/sf_log.txt ADDED
The diff for this file is too large to render. See raw diff