Caesarrr commited on
Commit
442f9cd
·
verified ·
1 Parent(s): 86d3f82

Upload folder using huggingface_hub

Browse files
Files changed (10) hide show
  1. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/best_000046560_23838720_reward_13124.950.pth +3 -0
  2. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000017536_8978432.pth +3 -0
  3. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000031936_16351232.pth +3 -0
  4. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000047232_24182784.pth +3 -0
  5. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000048864_25018368.pth +3 -0
  6. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000048880_25026560.pth +3 -0
  7. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/config.json +255 -0
  8. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/episode_metrics.jsonl +0 -0
  9. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/git.diff +7 -0
  10. factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/sf_log.txt +0 -0
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/best_000046560_23838720_reward_13124.950.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7e25bdad1aa41adf17f899857031c00aee8744f5afc73c59df4f80ea9278bd
3
+ size 21547577
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000017536_8978432.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3affc2df3f7aa8ca07e12f80de3e8a2542ff263869aed9e58609f8b0e551eba8
3
+ size 21547937
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000031936_16351232.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c92ae35f57b6f7dd383c736f22951c5fa3d4059037dbe4ab7a5e86603801329
3
+ size 21547937
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000047232_24182784.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7125d6062812f9733619234cd0d671a77ed899eddc8d6a0d45c623ddd80b6dc7
3
+ size 21547937
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000048864_25018368.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d99b895f0a278208ec49f47db2747b484dedaf98de87ee6e864fc53743b472b5
3
+ size 21547937
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/checkpoint_p0/checkpoint_000048880_25026560.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48ae89909b6589fd21baf75b115dbb3d76230ffa55b2b3692be325395d63f963
3
+ size 21547937
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/config.json ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "help": false,
3
+ "algo": "APPO",
4
+ "env": "latency_demon_attack",
5
+ "experiment": "demon_attack_frame_stack_uniform_u2_6_fs10_seed14",
6
+ "train_dir": "results/checkpoints_factor_sweeps/demon_attack/context_window",
7
+ "restart_behavior": "resume",
8
+ "device": "gpu",
9
+ "seed": 14,
10
+ "num_policies": 1,
11
+ "async_rl": true,
12
+ "serial_mode": false,
13
+ "batched_sampling": true,
14
+ "num_batches_to_accumulate": 2,
15
+ "worker_num_splits": 1,
16
+ "policy_workers_per_policy": 1,
17
+ "max_policy_lag": 300,
18
+ "num_workers": 1,
19
+ "num_envs_per_worker": 1,
20
+ "batch_size": 1024,
21
+ "num_batches_per_epoch": 8,
22
+ "num_epochs": 2,
23
+ "rollout": 64,
24
+ "recurrence": 32,
25
+ "shuffle_minibatches": false,
26
+ "gamma": 0.99,
27
+ "reward_scale": 1.0,
28
+ "reward_clip": 1000.0,
29
+ "value_bootstrap": false,
30
+ "normalize_returns": true,
31
+ "exploration_loss_coeff": 0.003,
32
+ "value_loss_coeff": 0.5,
33
+ "kl_loss_coeff": 0.0,
34
+ "exploration_loss": "entropy",
35
+ "gae_lambda": 0.95,
36
+ "ppo_clip_ratio": 0.1,
37
+ "ppo_clip_value": 0.2,
38
+ "with_vtrace": false,
39
+ "vtrace_rho": 1.0,
40
+ "vtrace_c": 1.0,
41
+ "optimizer": "adam",
42
+ "adam_eps": 1e-05,
43
+ "adam_beta1": 0.9,
44
+ "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.0,
46
+ "learning_rate": 0.000303,
47
+ "lr_schedule": "linear_decay",
48
+ "lr_schedule_kl_threshold": 0.008,
49
+ "lr_adaptive_min": 1e-06,
50
+ "lr_adaptive_max": 0.01,
51
+ "obs_subtract_mean": 0.0,
52
+ "obs_scale": 255.0,
53
+ "normalize_input": true,
54
+ "normalize_input_keys": null,
55
+ "decorrelate_experience_max_seconds": 0,
56
+ "decorrelate_envs_on_one_worker": true,
57
+ "actor_worker_gpus": [
58
+ 0
59
+ ],
60
+ "set_workers_cpu_affinity": true,
61
+ "force_envs_single_thread": false,
62
+ "default_niceness": 0,
63
+ "log_to_file": true,
64
+ "experiment_summaries_interval": 1,
65
+ "flush_summaries_interval": 30,
66
+ "stats_avg": 100,
67
+ "summaries_use_frameskip": true,
68
+ "heartbeat_interval": 20,
69
+ "heartbeat_reporting_interval": 180,
70
+ "train_for_env_steps": 25000000,
71
+ "train_for_seconds": 10000000000,
72
+ "save_every_sec": 600,
73
+ "keep_checkpoints": 5,
74
+ "load_checkpoint_kind": "latest",
75
+ "save_milestones_sec": -1,
76
+ "save_best_every_sec": 5,
77
+ "save_best_metric": "reward",
78
+ "save_best_after": 100000,
79
+ "benchmark": false,
80
+ "encoder_mlp_layers": [
81
+ 512,
82
+ 512
83
+ ],
84
+ "encoder_conv_architecture": "convnet_atari",
85
+ "encoder_conv_mlp_layers": [
86
+ 512
87
+ ],
88
+ "use_rnn": false,
89
+ "rnn_size": 512,
90
+ "rnn_type": "gru",
91
+ "rnn_num_layers": 1,
92
+ "decoder_mlp_layers": [],
93
+ "nonlinearity": "elu",
94
+ "policy_initialization": "orthogonal",
95
+ "policy_init_gain": 1.0,
96
+ "actor_critic_share_weights": true,
97
+ "adaptive_stddev": true,
98
+ "continuous_tanh_scale": 0.0,
99
+ "initial_stddev": 1.0,
100
+ "use_env_info_cache": false,
101
+ "env_gpu_actions": true,
102
+ "env_gpu_observations": true,
103
+ "env_frameskip": 1,
104
+ "env_framestack": 1,
105
+ "pixel_format": "CHW",
106
+ "use_record_episode_statistics": false,
107
+ "with_wandb": true,
108
+ "wandb_user": null,
109
+ "wandb_project": "latency-sensitive-bench",
110
+ "wandb_group": "demon-attack-fs10-uniform_u2_6",
111
+ "wandb_job_type": "sample_factory",
112
+ "wandb_tags": [
113
+ "factor_sweep",
114
+ "demon-attack",
115
+ "frame_stack",
116
+ "uniform",
117
+ "uniform_u2_6",
118
+ "fs10",
119
+ "seed14"
120
+ ],
121
+ "with_pbt": false,
122
+ "pbt_mix_policies_in_one_env": true,
123
+ "pbt_period_env_steps": 5000000,
124
+ "pbt_start_mutation": 20000000,
125
+ "pbt_replace_fraction": 0.3,
126
+ "pbt_mutation_rate": 0.15,
127
+ "pbt_replace_reward_gap": 0.1,
128
+ "pbt_replace_reward_gap_absolute": 1e-06,
129
+ "pbt_optimize_gamma": false,
130
+ "pbt_target_objective": "true_objective",
131
+ "pbt_perturb_min": 1.1,
132
+ "pbt_perturb_max": 1.5,
133
+ "env_id": "ALE/DemonAttack-v5",
134
+ "env_fps": 60.0,
135
+ "obs_fps": 15.0,
136
+ "screen_size": 84,
137
+ "noop_max": 30,
138
+ "frame_stack": 10,
139
+ "terminal_on_life_loss": true,
140
+ "clip_reward": true,
141
+ "repeat_action_probability": 0.0,
142
+ "full_action_space": false,
143
+ "max_episode_steps": 25000,
144
+ "simulator": "gpu",
145
+ "gpu_env_device": "auto",
146
+ "gpu_env_batch_size": 512,
147
+ "export_env_raw_rgb_frames": false,
148
+ "mode": "train",
149
+ "latency_type": "uniform_distribution",
150
+ "fixed_latency_ms": null,
151
+ "mean_latency_ms": null,
152
+ "std_latency_ms": null,
153
+ "min_latency_ms": 33.333333333333336,
154
+ "max_latency_ms": 100.0,
155
+ "latency_seed": 14,
156
+ "add_latency_info": false,
157
+ "max_pending_actions": null,
158
+ "hold_policy": "hold",
159
+ "ordering_policy": "latest_ready",
160
+ "eval_episodes": 100,
161
+ "eval_parallel_envs": 100,
162
+ "eval_latency_raw_frame_values": "0,1,2,3,4,5",
163
+ "eval_max_steps": 36000,
164
+ "eval_deterministic": true,
165
+ "eval_raw_reward": true,
166
+ "episode_metrics_path": "results/checkpoints_factor_sweeps/demon_attack/context_window/demon_attack_frame_stack_uniform_u2_6_fs10_seed14/episode_metrics.jsonl",
167
+ "command_line": "--mode train --algo APPO --env latency_demon_attack --experiment demon_attack_frame_stack_uniform_u2_6_fs10_seed14 --train_dir results/checkpoints_factor_sweeps/demon_attack/context_window --restart_behavior resume --device gpu --actor_worker_gpus 0 --env_gpu_observations True --env_gpu_actions True --gpu-env-batch-size 512 --seed 14 --episode_metrics_path results/checkpoints_factor_sweeps/demon_attack/context_window/demon_attack_frame_stack_uniform_u2_6_fs10_seed14/episode_metrics.jsonl --train_for_env_steps 25000000 --num_workers 1 --num_envs_per_worker 1 --num_policies 1 --batch_size 1024 --rollout 64 --recurrence 32 --num_epochs 2 --num_batches_per_epoch 8 --worker_num_splits 1 --max_policy_lag 300 --learning_rate 0.000303 --gamma 0.99 --gae_lambda 0.95 --ppo_clip_ratio 0.1 --ppo_clip_value 0.2 --value_loss_coeff 0.5 --max_grad_norm 0.0 --save_every_sec 600 --keep_checkpoints 5 --stats_avg 100 --experiment_summaries_interval 1 --batched_sampling True --async_rl True --batched_sampling True --use_rnn False --normalize_returns True --normalize_input True --latency-type uniform_distribution --min-latency-ms 33.333333333333336 --max-latency-ms 100.0 --latency-seed 14 --add-latency-info False --eval-episodes 100 --eval-parallel-envs 100 --eval-max-steps 36000 --eval-deterministic True --eval-raw-reward --with_wandb True --wandb_project latency-sensitive-bench --wandb_group demon-attack-fs10-uniform_u2_6 --wandb_job_type sample_factory --wandb_tags factor_sweep demon-attack frame_stack uniform uniform_u2_6 fs10 seed14 --env_id ALE/DemonAttack-v5 --env-fps 60 --obs-fps 15.0 --screen_size 84 --noop_max 30 --frame_stack 10 --terminal_on_life_loss True --clip_reward True --repeat_action_probability 0.0 --full_action_space False --max_episode_steps 25000 --simulator gpu --gpu-env-device auto --hold-policy hold --ordering-policy latest_ready",
168
+ "cli_args": {
169
+ "algo": "APPO",
170
+ "env": "latency_demon_attack",
171
+ "experiment": "demon_attack_frame_stack_uniform_u2_6_fs10_seed14",
172
+ "train_dir": "results/checkpoints_factor_sweeps/demon_attack/context_window",
173
+ "restart_behavior": "resume",
174
+ "device": "gpu",
175
+ "seed": 14,
176
+ "num_policies": 1,
177
+ "async_rl": true,
178
+ "batched_sampling": true,
179
+ "worker_num_splits": 1,
180
+ "max_policy_lag": 300,
181
+ "num_workers": 1,
182
+ "num_envs_per_worker": 1,
183
+ "batch_size": 1024,
184
+ "num_batches_per_epoch": 8,
185
+ "num_epochs": 2,
186
+ "rollout": 64,
187
+ "recurrence": 32,
188
+ "gamma": 0.99,
189
+ "normalize_returns": true,
190
+ "value_loss_coeff": 0.5,
191
+ "gae_lambda": 0.95,
192
+ "ppo_clip_ratio": 0.1,
193
+ "ppo_clip_value": 0.2,
194
+ "max_grad_norm": 0.0,
195
+ "learning_rate": 0.000303,
196
+ "normalize_input": true,
197
+ "actor_worker_gpus": [
198
+ 0
199
+ ],
200
+ "experiment_summaries_interval": 1,
201
+ "stats_avg": 100,
202
+ "train_for_env_steps": 25000000,
203
+ "save_every_sec": 600,
204
+ "keep_checkpoints": 5,
205
+ "use_rnn": false,
206
+ "env_gpu_actions": true,
207
+ "env_gpu_observations": true,
208
+ "with_wandb": true,
209
+ "wandb_project": "latency-sensitive-bench",
210
+ "wandb_group": "demon-attack-fs10-uniform_u2_6",
211
+ "wandb_job_type": "sample_factory",
212
+ "wandb_tags": [
213
+ "factor_sweep",
214
+ "demon-attack",
215
+ "frame_stack",
216
+ "uniform",
217
+ "uniform_u2_6",
218
+ "fs10",
219
+ "seed14"
220
+ ],
221
+ "env_id": "ALE/DemonAttack-v5",
222
+ "env_fps": 60.0,
223
+ "obs_fps": 15.0,
224
+ "screen_size": 84,
225
+ "noop_max": 30,
226
+ "frame_stack": 10,
227
+ "terminal_on_life_loss": true,
228
+ "clip_reward": true,
229
+ "repeat_action_probability": 0.0,
230
+ "full_action_space": false,
231
+ "max_episode_steps": 25000,
232
+ "simulator": "gpu",
233
+ "gpu_env_device": "auto",
234
+ "gpu_env_batch_size": 512,
235
+ "mode": "train",
236
+ "latency_type": "uniform_distribution",
237
+ "min_latency_ms": 33.333333333333336,
238
+ "max_latency_ms": 100.0,
239
+ "latency_seed": 14,
240
+ "add_latency_info": false,
241
+ "hold_policy": "hold",
242
+ "ordering_policy": "latest_ready",
243
+ "eval_episodes": 100,
244
+ "eval_parallel_envs": 100,
245
+ "eval_max_steps": 36000,
246
+ "eval_deterministic": true,
247
+ "eval_raw_reward": true,
248
+ "episode_metrics_path": "results/checkpoints_factor_sweeps/demon_attack/context_window/demon_attack_frame_stack_uniform_u2_6_fs10_seed14/episode_metrics.jsonl"
249
+ },
250
+ "git_hash": "eb3a2e1efbd2aa03a60d7f44f5e18d8fdd0f5a2d",
251
+ "git_repo_name": "git@github.com:ZihanWang314/latency-sensitive-bench.git",
252
+ "eval_env_frameskip": 1,
253
+ "output_dir": "outputs/factor_sweeps/demon_attack/context_window/train/frame_stack/uniform_u2_6/fs10/seed_14",
254
+ "wandb_unique_id": "demon-attack-fs10-uniform_u2_6-s14"
255
+ }
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/episode_metrics.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/git.diff ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ diff --git a/starVLA b/starVLA
2
+ index ab3380d..9d8c567 160000
3
+ --- a/starVLA
4
+ +++ b/starVLA
5
+ @@ -1 +1 @@
6
+ -Subproject commit ab3380dfbd1de9649c15d154cc41b97788674537
7
+ +Subproject commit 9d8c567188a3aa2a825296016cf17f3977101d8f
factor_sweeps/demon_attack/context_window/train/factor_sweep:demon_attack:frame_stack:uniform_u2_6:fs10:obs15:stride4:seed14/sf_log.txt ADDED
The diff for this file is too large to render. See raw diff