diff --git a/.gitattributes b/.gitattributes
index 7c16e036d39f300a6bff409dc043429e731bb313..2a9e7269db0d10de044a298db10f28c707e3628c 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -42,3 +42,12 @@ wipe_l1_regression/wandb/wandb/run-20251005_163743-a1znetn8/run-a1znetn8.wandb f
cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/run-quokv8gn.wandb filter=lfs diff=lfs merge=lfs -text
cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/run-fqdwkc8m.wandb filter=lfs diff=lfs merge=lfs -text
glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/run-tmwli25x.wandb filter=lfs diff=lfs merge=lfs -text
+glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/run-7ovz4jzt.wandb filter=lfs diff=lfs merge=lfs -text
+eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/run-qzez8pv7.wandb filter=lfs diff=lfs merge=lfs -text
+all_l1/wandb/wandb/run-20250930_131250-ea1k0g3y/run-ea1k0g3y.wandb filter=lfs diff=lfs merge=lfs -text
+all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/run-x94cyrsz.wandb filter=lfs diff=lfs merge=lfs -text
+eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/run-yqnt28c8.wandb filter=lfs diff=lfs merge=lfs -text
+all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/run-3b31u4we.wandb filter=lfs diff=lfs merge=lfs -text
+wipe_flow_matching/wandb/wandb/run-20251005_163812-0cfqmuqw/run-0cfqmuqw.wandb filter=lfs diff=lfs merge=lfs -text
+pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/run-a381qnn9.wandb filter=lfs diff=lfs merge=lfs -text
+cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/run-gqyapbwp.wandb filter=lfs diff=lfs merge=lfs -text
diff --git a/all_flow_matching/glue_best/config.yaml b/all_flow_matching/glue_best/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..d7d6eea24c1bf2969fe7bcb9ae2f53c6e0daacda
--- /dev/null
+++ b/all_flow_matching/glue_best/config.yaml
@@ -0,0 +1,316 @@
+run_name: glue_20250924_082336
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: false
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: false
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 32
+lora_llm: true
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20250924_082336
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/all_flow_matching/glue_best/step11000-action-head/metadata.pt b/all_flow_matching/glue_best/step11000-action-head/metadata.pt
new file mode 100644
index 0000000000000000000000000000000000000000..4213022058fd255643542ce0165dba7a5c03285e
--- /dev/null
+++ b/all_flow_matching/glue_best/step11000-action-head/metadata.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:91bd03dced0b2509ade669c28c4f205463e4b4e83b54d6726754eeb8ea952bfe
+size 1331
diff --git a/all_flow_matching/glue_best/step11500-action-head/metadata.pt b/all_flow_matching/glue_best/step11500-action-head/metadata.pt
new file mode 100644
index 0000000000000000000000000000000000000000..4e34304d65d6217c2b0a33ee0a75ccecc5e8f82c
--- /dev/null
+++ b/all_flow_matching/glue_best/step11500-action-head/metadata.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7fb72b6306ce04d1beb20bb289509f00c39a40845ff7c4b36bf4deb4e83fe82a
+size 1331
diff --git a/all_flow_matching/glue_best/step11500-unsharded/config.yaml b/all_flow_matching/glue_best/step11500-unsharded/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..415175e1816b20af0f8fe39139f7849a85f694d1
--- /dev/null
+++ b/all_flow_matching/glue_best/step11500-unsharded/config.yaml
@@ -0,0 +1,316 @@
+run_name: glue_20250924_082336
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: false
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: false
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 32
+lora_llm: true
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20250924_082336
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/all_flow_matching/glue_best/step11500-unsharded/lora.pt b/all_flow_matching/glue_best/step11500-unsharded/lora.pt
new file mode 100644
index 0000000000000000000000000000000000000000..ef6964587bd74b0d3565d65918b9ff63783a6d7d
--- /dev/null
+++ b/all_flow_matching/glue_best/step11500-unsharded/lora.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6269c7cb774e69a5c43b4109cffb347c2936232c5222e2b8a75056ee1188671d
+size 304417027
diff --git a/all_flow_matching/glue_best/step11500-unsharded/train.pt b/all_flow_matching/glue_best/step11500-unsharded/train.pt
new file mode 100644
index 0000000000000000000000000000000000000000..304e866bcbeb62d241e65854fbec30a06ebf883f
--- /dev/null
+++ b/all_flow_matching/glue_best/step11500-unsharded/train.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b1734f30ac548c86aa66c22a5cfb32bd2320a41d56faab841b4fd53020a6d1b
+size 15061
diff --git a/all_flow_matching/glue_best/step11500/config.yaml b/all_flow_matching/glue_best/step11500/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..415175e1816b20af0f8fe39139f7849a85f694d1
--- /dev/null
+++ b/all_flow_matching/glue_best/step11500/config.yaml
@@ -0,0 +1,316 @@
+run_name: glue_20250924_082336
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: false
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: false
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 32
+lora_llm: true
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20250924_082336
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/all_flow_matching/glue_best/wandb/wandb/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..e84c27228092453f22934b1211aa4706f57edff5
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/debug-internal.log
@@ -0,0 +1,13 @@
+{"time":"2025-09-24T08:24:16.705237241Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T08:24:17.754431561Z","level":"INFO","msg":"stream: created new stream","id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754478082Z","level":"INFO","msg":"stream: started","id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754498402Z","level":"INFO","msg":"sender: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754506202Z","level":"INFO","msg":"writer: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754546793Z","level":"INFO","msg":"handler: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T15:15:45.267501791Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-24T20:24:27.534186056Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-25T23:01:28.093149981Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-26T02:33:15.940926228Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/4dp69fok/file_stream","body":"\n
\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-09-26T19:36:48.428667728Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/4dp69fok/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-09-26T20:06:50.687851553Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-26T20:59:26.86775551Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/debug.log b/all_flow_matching/glue_best/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_061930-dnrnwv30/run-dnrnwv30.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_061930-dnrnwv30/run-dnrnwv30.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..d2da9e7426e9b1a94e8794debc1685805b43c016
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_061930-dnrnwv30/run-dnrnwv30.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_062357-hmmpns57/run-hmmpns57.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_062357-hmmpns57/run-hmmpns57.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..201bd6c3acb86a6890ae94fee166f4597697f738
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_062357-hmmpns57/run-hmmpns57.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..1eb1ed588204d23cd0b097f0aee9a5c4d0fbff20
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/config.yaml
@@ -0,0 +1,611 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ o421nvn5u6ub6ruog26gg83x0g2lmgbt:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "51147874304"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x137c9ede1bb1518e"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x21a2e88d06c419dc"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x399226d2b2bfa544"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x3558c3014c813fdb"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf61ec17df11883bd"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x9b5c1c302c8129f8"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xfa8b85a4625b04f"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa515afd8ced1d39d"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-188
+ memory:
+ total: "2434606952448"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758954648"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1605"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-188
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758695448"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1605"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-188
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "2191329"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-188
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T06:31:28.005264Z"
+ writerId: o421nvn5u6ub6ruog26gg83x0g2lmgbt
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 13
+ - 15
+ - 16
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_063100
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..d97b5deaa63e687c945bba56ed8497e474d74344
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/files/output.log
@@ -0,0 +1,33 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [06:31:30] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': 'Lerobot_Glue_best', 'path': '/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/mnt/data2/guominghao/a1/warehouse/glue_lerobot', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [06:31:31] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [06:31:32] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:517
+****** Import RLDSBatchTransform, RLDSDataset successfully.
+****** before RLDS dataset...
+****** data_config.rlds_dataset_name: Lerobot_Glue_best
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", line 397, in
+ train(cfg)
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 160, in main
+ train_loader = build_train_dataloader(cfg, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 196, in build_train_dataloader
+ return build_vla_train_dataloader(train_config, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 314, in build_vla_train_dataloader
+ ds = build_rlds_train_dataset(train_config, _normalization_type, _image_augmentation, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 527, in build_rlds_train_dataset
+ dataset = RLDSDataset(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds_datasets.py", line 355, in __init__
+ per_dataset_kwargs, weights = get_oxe_dataset_kwargs_and_weights(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds/oxe/materialize.py", line 119, in get_oxe_dataset_kwargs_and_weights
+ make_oxe_dataset_kwargs(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds/oxe/materialize.py", line 31, in make_oxe_dataset_kwargs
+ dataset_kwargs = deepcopy(OXE_DATASET_CONFIGS[dataset_name])
+KeyError: 'Lerobot_Glue_best'
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/run-wtatxotn.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/run-wtatxotn.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..a21aaa427fc51de5ff1e1a2e3b1097539fc3be63
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063128-wtatxotn/run-wtatxotn.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..faef4a4fd8d99630c06f783fb6a8359b3332e6cc
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/config.yaml
@@ -0,0 +1,611 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ 71y4kqofohuhlolkoekjc4r6f1aprdzt:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "51148013568"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x9b5c1c302c8129f8"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf61ec17df11883bd"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x137c9ede1bb1518e"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xfa8b85a4625b04f"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x3558c3014c813fdb"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa515afd8ced1d39d"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x399226d2b2bfa544"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x21a2e88d06c419dc"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-188
+ memory:
+ total: "2434606952448"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758954964"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1606"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-188
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758695764"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1606"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-188
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "2192665"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-188
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T06:36:42.806544Z"
+ writerId: 71y4kqofohuhlolkoekjc4r6f1aprdzt
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 13
+ - 15
+ - 16
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_063615
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..ed326e21e6dcbbdec975b81458ac57451dd50850
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/output.log
@@ -0,0 +1,33 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [06:36:44] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': 'Lerobot_Glue_best', 'path': '/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1', 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/mnt/data2/guominghao/a1/warehouse/glue_lerobot', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [06:36:46] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [06:36:47] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:517
+****** Import RLDSBatchTransform, RLDSDataset successfully.
+****** before RLDS dataset...
+****** data_config.rlds_dataset_name: Lerobot_Glue_best
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", line 397, in
+ train(cfg)
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 160, in main
+ train_loader = build_train_dataloader(cfg, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 196, in build_train_dataloader
+ return build_vla_train_dataloader(train_config, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 314, in build_vla_train_dataloader
+ ds = build_rlds_train_dataset(train_config, _normalization_type, _image_augmentation, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 527, in build_rlds_train_dataset
+ dataset = RLDSDataset(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds_datasets.py", line 355, in __init__
+ per_dataset_kwargs, weights = get_oxe_dataset_kwargs_and_weights(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds/oxe/materialize.py", line 119, in get_oxe_dataset_kwargs_and_weights
+ make_oxe_dataset_kwargs(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/rlds/oxe/materialize.py", line 31, in make_oxe_dataset_kwargs
+ dataset_kwargs = deepcopy(OXE_DATASET_CONFIGS[dataset_name])
+KeyError: 'Lerobot_Glue_best'
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..9cf6722896b8682405e32a4100d835a5be0f3ae2
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/requirements.txt
@@ -0,0 +1,283 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+numpy==2.2.6
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..f6d743b566613e728d857eb388a5c442e718ad67
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T06:36:42.806544Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-188",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "51148013568"
+ }
+ },
+ "memory": {
+ "total": "2434606952448"
+ },
+ "gpu_amd": [
+ {
+ "id": "1",
+ "uniqueId": "0x9b5c1c302c8129f8",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xf61ec17df11883bd",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x137c9ede1bb1518e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xfa8b85a4625b04f",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x3558c3014c813fdb",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xa515afd8ced1d39d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x399226d2b2bfa544",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x21a2e88d06c419dc",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758954964",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1606",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-188",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758695764",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1606",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-188",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "2192665",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-188",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "71y4kqofohuhlolkoekjc4r6f1aprdzt"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..5031a3fdb5637a89ebf85a0681ed18b6e711fde3
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/files/wandb-summary.json
@@ -0,0 +1 @@
+{"_runtime":2,"_wandb":{"runtime":2}}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..5c17f07c64f4de4919629ca548e01abe9c2627d8
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/logs/debug-internal.log
@@ -0,0 +1,11 @@
+{"time":"2025-09-24T06:36:43.051707086Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T06:36:44.180319507Z","level":"INFO","msg":"stream: created new stream","id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:44.180366367Z","level":"INFO","msg":"stream: started","id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:44.180386688Z","level":"INFO","msg":"writer: started","stream_id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:44.180391338Z","level":"INFO","msg":"handler: started","stream_id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:44.180402908Z","level":"INFO","msg":"sender: started","stream_id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:47.096300319Z","level":"INFO","msg":"stream: closing","id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:48.366366183Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T06:36:48.706218134Z","level":"INFO","msg":"handler: closed","stream_id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:48.707592142Z","level":"INFO","msg":"sender: closed","stream_id":"6tj2c8pr"}
+{"time":"2025-09-24T06:36:48.707612462Z","level":"INFO","msg":"stream: closed","id":"6tj2c8pr"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/run-6tj2c8pr.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/run-6tj2c8pr.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..ac37fee0df4d5d3a0eae9a3ea4cdfbbdd12826f6
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_063642-6tj2c8pr/run-6tj2c8pr.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..4b49b68947dd24fe5ec597ad1d5d8773e8ecf53c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/config.yaml
@@ -0,0 +1,611 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ ym1fr90agfv5lp1xadwns4zfs5lnvysu:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "51148275712"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x399226d2b2bfa544"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x3558c3014c813fdb"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa515afd8ced1d39d"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x137c9ede1bb1518e"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xfa8b85a4625b04f"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x21a2e88d06c419dc"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x9b5c1c302c8129f8"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf61ec17df11883bd"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-188
+ memory:
+ total: "2434606952448"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758955952"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1607"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-188
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758696752"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1607"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-188
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "2194698"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-188
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T06:53:10.958875Z"
+ writerId: ym1fr90agfv5lp1xadwns4zfs5lnvysu
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 13
+ - 15
+ - 16
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_065243
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..6f45df2889b3391f2d7dfe9de0908f3bd379c312
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/output.log
@@ -0,0 +1,29 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [06:53:12] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [06:53:14] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [06:53:15] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", line 397, in
+ train(cfg)
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 160, in main
+ train_loader = build_train_dataloader(cfg, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 196, in build_train_dataloader
+ return build_vla_train_dataloader(train_config, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 327, in build_vla_train_dataloader
+ ds = build_lerobot_train_dataset(train_config, normalization_type,device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 435, in build_lerobot_train_dataset
+ from olmo.data.vla.lerobot_datasets import LeRobotDatasetWrapper
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/lerobot_datasets.py", line 71, in
+ class LeRobotDatasetWrapper(Dataset):
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/lerobot_datasets.py", line 72, in LeRobotDatasetWrapper
+ def __init__(self, dataset_path, chunk_size=NUM_ACTIONS_CHUNK,
+NameError: name 'NUM_ACTIONS_CHUNK' is not defined
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..9cf6722896b8682405e32a4100d835a5be0f3ae2
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/requirements.txt
@@ -0,0 +1,283 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+numpy==2.2.6
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..cf1ea9a3d5eea29f4a5975a0fa2f599fb3b2e2f3
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T06:53:10.958875Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-188",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "51148275712"
+ }
+ },
+ "memory": {
+ "total": "2434606952448"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0x399226d2b2bfa544",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x3558c3014c813fdb",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xa515afd8ced1d39d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x137c9ede1bb1518e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xfa8b85a4625b04f",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x21a2e88d06c419dc",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x9b5c1c302c8129f8",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xf61ec17df11883bd",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758955952",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1607",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-188",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758696752",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1607",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-188",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "2194698",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-188",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "ym1fr90agfv5lp1xadwns4zfs5lnvysu"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..8afb95f49483c85658a334253ad61c5e4b5851ef
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/files/wandb-summary.json
@@ -0,0 +1 @@
+{"_wandb":{"runtime":2},"_runtime":2}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..d82981f6e2d3b822f626727a42386bf64ae10573
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-core.log
@@ -0,0 +1,14 @@
+{"time":"2025-09-24T06:53:11.01260872Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpysryscrf/port-2194776.txt","pid":2194776,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T06:53:11.013097116Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2194776}
+{"time":"2025-09-24T06:53:11.013088106Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2194776-2194946-2300508100/socket","Net":"unix"}}
+{"time":"2025-09-24T06:53:11.195667052Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T06:53:11.202657842Z","level":"INFO","msg":"handleInformInit: received","streamId":"qsv5q1hc","id":"1(@)"}
+{"time":"2025-09-24T06:53:12.34562108Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"qsv5q1hc","id":"1(@)"}
+{"time":"2025-09-24T06:53:15.425080291Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T06:53:15.425127242Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T06:53:15.425161212Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T06:53:15.425190602Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T06:53:15.425244213Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2194776-2194946-2300508100/socket","Net":"unix"}}
+{"time":"2025-09-24T06:53:16.766852773Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T06:53:16.767200728Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T06:53:16.767210378Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..a3d36455daa64019166205cb06c4d32beb199da9
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug-internal.log
@@ -0,0 +1,11 @@
+{"time":"2025-09-24T06:53:11.204449275Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T06:53:12.345567379Z","level":"INFO","msg":"stream: created new stream","id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:12.345615649Z","level":"INFO","msg":"stream: started","id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:12.34563651Z","level":"INFO","msg":"sender: started","stream_id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:12.34563539Z","level":"INFO","msg":"writer: started","stream_id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:12.34568667Z","level":"INFO","msg":"handler: started","stream_id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:15.425126022Z","level":"INFO","msg":"stream: closing","id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:16.457729801Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T06:53:16.764520193Z","level":"INFO","msg":"handler: closed","stream_id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:16.765675218Z","level":"INFO","msg":"sender: closed","stream_id":"qsv5q1hc"}
+{"time":"2025-09-24T06:53:16.765705399Z","level":"INFO","msg":"stream: closed","id":"qsv5q1hc"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..2c2bb4e462e89dd0da3e765cacde1ec15eadf78a
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/logs/debug.log
@@ -0,0 +1 @@
+2025-09-24 06:53:15,425 INFO wandb-AsyncioManager-main:2194776 [service_client.py:_forward_responses():84] Reached EOF.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/run-qsv5q1hc.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/run-qsv5q1hc.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..a732e85aa203f63179a662705ddc5c96cec6f2fd
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065310-qsv5q1hc/run-qsv5q1hc.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..645267e3eb927ab8be45cf0dd0726e7178c3331b
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/config.yaml
@@ -0,0 +1,611 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ pv6kdvw48bx7dygl9qkpmbu5bsrvk9dc:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "51148382208"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x3558c3014c813fdb"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xfa8b85a4625b04f"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x9b5c1c302c8129f8"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x399226d2b2bfa544"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa515afd8ced1d39d"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x137c9ede1bb1518e"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf61ec17df11883bd"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x21a2e88d06c419dc"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-188
+ memory:
+ total: "2434606952448"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758956113"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1608"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-188
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758696913"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1608"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-188
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "2195813"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-188
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T06:55:50.673091Z"
+ writerId: pv6kdvw48bx7dygl9qkpmbu5bsrvk9dc
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 13
+ - 15
+ - 16
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_065523
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..ac244d7e029f16d47dbd1b46ec448f61a897e312
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/output.log
@@ -0,0 +1,47 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [06:55:52] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [06:55:54] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", line 397, in
+ train(cfg)
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 160, in main
+ train_loader = build_train_dataloader(cfg, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 196, in build_train_dataloader
+ return build_vla_train_dataloader(train_config, device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 327, in build_vla_train_dataloader
+ ds = build_lerobot_train_dataset(train_config, normalization_type,device)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/__init__.py", line 439, in build_lerobot_train_dataset
+ dataset = LeRobotDatasetWrapper(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/vla/lerobot_datasets.py", line 84, in __init__
+ dataset_demo = LeRobotDataset(repo_id=os.path.basename(dataset_path),root=dataset_path)
+ File "/vast/users/xiaodan/zhangjian/lerobot/src/lerobot/datasets/lerobot_dataset.py", line 610, in __init__
+ self.meta = LeRobotDatasetMetadata(
+ File "/vast/users/xiaodan/zhangjian/lerobot/src/lerobot/datasets/lerobot_dataset.py", line 101, in __init__
+ self.load_metadata()
+ File "/vast/users/xiaodan/zhangjian/lerobot/src/lerobot/datasets/lerobot_dataset.py", line 112, in load_metadata
+ check_version_compatibility(self.repo_id, self._version, CODEBASE_VERSION)
+ File "/vast/users/xiaodan/zhangjian/lerobot/src/lerobot/datasets/utils.py", line 487, in check_version_compatibility
+ raise BackwardCompatibilityError(repo_id, v_check)
+lerobot.datasets.backward_compatibility.BackwardCompatibilityError:
+The dataset you requested (Lerobot_Glue_best) is in 2.1 format.
+
+We introduced a new format since v3.0 which is not backward compatible with v2.1.
+Please, update your dataset to the new format using this command:
+```
+python -m lerobot.datasets.v30.convert_dataset_v21_to_v30 --repo-id=Lerobot_Glue_best
+```
+
+If you encounter a problem, contact LeRobot maintainers on [Discord](https://discord.com/invite/s3KuuzsPFb)
+or open an [issue on GitHub](https://github.com/huggingface/lerobot/issues/new/choose).
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..9cf6722896b8682405e32a4100d835a5be0f3ae2
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/requirements.txt
@@ -0,0 +1,283 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+numpy==2.2.6
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..778dd7e6e21c48c20fb07a5ad385f1d2645a6164
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T06:55:50.673091Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-188",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "51148382208"
+ }
+ },
+ "memory": {
+ "total": "2434606952448"
+ },
+ "gpu_amd": [
+ {
+ "id": "0",
+ "uniqueId": "0x3558c3014c813fdb",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xfa8b85a4625b04f",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x9b5c1c302c8129f8",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x399226d2b2bfa544",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xa515afd8ced1d39d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x137c9ede1bb1518e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xf61ec17df11883bd",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x21a2e88d06c419dc",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758956113",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1608",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-188",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758696913",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1608",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-188",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "2195813",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-188",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "pv6kdvw48bx7dygl9qkpmbu5bsrvk9dc"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..8afb95f49483c85658a334253ad61c5e4b5851ef
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/files/wandb-summary.json
@@ -0,0 +1 @@
+{"_wandb":{"runtime":2},"_runtime":2}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..ad4640143771ea70431b958acb7e9706e7be6191
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-core.log
@@ -0,0 +1,14 @@
+{"time":"2025-09-24T06:55:50.723563798Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpjs8cyprs/port-2195891.txt","pid":2195891,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T06:55:50.72450232Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2195891}
+{"time":"2025-09-24T06:55:50.724421019Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2195891-2196055-1725862429/socket","Net":"unix"}}
+{"time":"2025-09-24T06:55:50.908962781Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T06:55:50.915479784Z","level":"INFO","msg":"handleInformInit: received","streamId":"lqn400wc","id":"1(@)"}
+{"time":"2025-09-24T06:55:52.044031974Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"lqn400wc","id":"1(@)"}
+{"time":"2025-09-24T06:55:54.891857034Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T06:55:54.89233836Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T06:55:54.89233283Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T06:55:54.89236797Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T06:55:54.892429561Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2195891-2196055-1725862429/socket","Net":"unix"}}
+{"time":"2025-09-24T06:55:56.94476761Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T06:55:56.944779601Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T06:55:56.944793901Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..f68eaf4b44d880232f6bebfdebef4d44ca49ed02
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug-internal.log
@@ -0,0 +1,11 @@
+{"time":"2025-09-24T06:55:50.917562781Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T06:55:52.043989044Z","level":"INFO","msg":"stream: created new stream","id":"lqn400wc"}
+{"time":"2025-09-24T06:55:52.044025974Z","level":"INFO","msg":"stream: started","id":"lqn400wc"}
+{"time":"2025-09-24T06:55:52.044043335Z","level":"INFO","msg":"handler: started","stream_id":"lqn400wc"}
+{"time":"2025-09-24T06:55:52.044047115Z","level":"INFO","msg":"writer: started","stream_id":"lqn400wc"}
+{"time":"2025-09-24T06:55:52.044082945Z","level":"INFO","msg":"sender: started","stream_id":"lqn400wc"}
+{"time":"2025-09-24T06:55:54.8923419Z","level":"INFO","msg":"stream: closing","id":"lqn400wc"}
+{"time":"2025-09-24T06:55:56.556098297Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T06:55:56.941936164Z","level":"INFO","msg":"handler: closed","stream_id":"lqn400wc"}
+{"time":"2025-09-24T06:55:56.943528235Z","level":"INFO","msg":"sender: closed","stream_id":"lqn400wc"}
+{"time":"2025-09-24T06:55:56.943536815Z","level":"INFO","msg":"stream: closed","id":"lqn400wc"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..ef460cc17d8b7dcdeaef0150925e66a2c6eb5387
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/logs/debug.log
@@ -0,0 +1 @@
+2025-09-24 06:55:54,891 INFO wandb-AsyncioManager-main:2195891 [service_client.py:_forward_responses():84] Reached EOF.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/run-lqn400wc.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/run-lqn400wc.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..05b7c3eed130597496d9095305a535645d24d2f4
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_065550-lqn400wc/run-lqn400wc.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..4de7f00bcf686e248b79f03ae2c3001e292cb02c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/config.yaml
@@ -0,0 +1,615 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ 1pt1kzn3156onku1dbmbvrh2eyknhblo:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "50552754176"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xab01f34fc0edbb6e"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x37e5d0f3d8682cca"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf07610cbfae55ec0"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x9a76422d710d96e6"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xe1b4f7497ad1d2db"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x2e0c5f8d27fbe8f1"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xca50e2816c5058ba"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xfaa84ccf6c76f5e3"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-295
+ memory:
+ total: "2434606931968"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758959301"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1610"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-295
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758700101"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1610"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-295
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "3944397"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-295
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T07:49:27.634943Z"
+ writerId: 1pt1kzn3156onku1dbmbvrh2eyknhblo
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 2
+ - 13
+ - 15
+ - 16
+ - 61
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "10":
+ - 19
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_074844
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..7d5896d461cf42d68d399ffb590c7b628a297216
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/output.log
@@ -0,0 +1,74 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [07:49:29] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [07:49:31] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [07:49:32] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [07:49:49] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.6._fsdp_wrapped_module.ff_out.parametrizations.weight.0.lora_A
+************* After get lora params successfully
+09/24 [07:51:21] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+!!!Training failed:
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main
+ trainer.fit()
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2277, in fit
+ for batch in self.train_loader:
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__
+ data = self._next_data()
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 790, in _next_data
+ data = self._dataset_fetcher.fetch(index) # may raise StopIteration
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 43, in fetch
+ return self.collate_fn(data)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 158, in __call__
+ self._add_action_tokens_to_batch(batch)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 254, in _add_action_tokens_to_batch
+ action_tokens = self._build_action_tokens()
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 337, in _build_action_tokens
+ assert len(right_eef_tokens) == ACTION_DIMS_MAPPING['right_end_effector']
+AssertionError
+wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..a95721ef10d8ba04dc6eff75ce19cc54856dd2a0
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T07:49:27.634943Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-295",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50552754176"
+ }
+ },
+ "memory": {
+ "total": "2434606931968"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0xab01f34fc0edbb6e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0x37e5d0f3d8682cca",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0xf07610cbfae55ec0",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x9a76422d710d96e6",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xe1b4f7497ad1d2db",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x2e0c5f8d27fbe8f1",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0xca50e2816c5058ba",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xfaa84ccf6c76f5e3",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758959301",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1610",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-295",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758700101",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1610",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-295",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "3944397",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-295",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "1pt1kzn3156onku1dbmbvrh2eyknhblo"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..d37289b216375b58e607c1b45b66467abe030900
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/files/wandb-summary.json
@@ -0,0 +1 @@
+{"_runtime":113.732812458,"System/Peak GPU Memory (MB)":39071.62890625,"_timestamp":1.7587002818870535e+09,"_step":0,"_wandb":{"runtime":113}}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..f1de6096fee1244a084940bc0106277e2e3b3212
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-core.log
@@ -0,0 +1,16 @@
+{"time":"2025-09-24T07:49:27.889617724Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpsbiq8ish/port-3944478.txt","pid":3944478,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T07:49:27.891870094Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3944478}
+{"time":"2025-09-24T07:49:27.892998519Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3944478-3944654-2489211586/socket","Net":"unix"}}
+{"time":"2025-09-24T07:49:28.091672549Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T07:49:28.107596353Z","level":"INFO","msg":"handleInformInit: received","streamId":"rwm1qqvr","id":"1(@)"}
+{"time":"2025-09-24T07:49:29.254468509Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"rwm1qqvr","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.363561879Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"rwm1qqvr","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367101887Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"rwm1qqvr","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367107627Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367113717Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367121007Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T07:51:25.367120867Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367156617Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367160127Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T07:51:25.367206328Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-3944478-3944654-2489211586/socket","Net":"unix"}}
+{"time":"2025-09-24T07:51:25.367223268Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..86b224065075de5be40afc9516bc2d8aaed07c43
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug-internal.log
@@ -0,0 +1,12 @@
+{"time":"2025-09-24T07:49:28.109477949Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T07:49:29.254414398Z","level":"INFO","msg":"stream: created new stream","id":"rwm1qqvr"}
+{"time":"2025-09-24T07:49:29.254462629Z","level":"INFO","msg":"stream: started","id":"rwm1qqvr"}
+{"time":"2025-09-24T07:49:29.254479529Z","level":"INFO","msg":"writer: started","stream_id":"rwm1qqvr"}
+{"time":"2025-09-24T07:49:29.254487509Z","level":"INFO","msg":"handler: started","stream_id":"rwm1qqvr"}
+{"time":"2025-09-24T07:49:29.254512839Z","level":"INFO","msg":"sender: started","stream_id":"rwm1qqvr"}
+{"time":"2025-09-24T07:51:23.341950674Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":1.454277139}],"total_operations":1}}
+{"time":"2025-09-24T07:51:24.999785419Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T07:51:25.363888344Z","level":"INFO","msg":"stream: closing","id":"rwm1qqvr"}
+{"time":"2025-09-24T07:51:25.363901414Z","level":"INFO","msg":"handler: closed","stream_id":"rwm1qqvr"}
+{"time":"2025-09-24T07:51:25.36514555Z","level":"INFO","msg":"sender: closed","stream_id":"rwm1qqvr"}
+{"time":"2025-09-24T07:51:25.36515125Z","level":"INFO","msg":"stream: closed","id":"rwm1qqvr"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/run-rwm1qqvr.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/run-rwm1qqvr.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..8b7441a79e6c1c14662958e18d33770763143f5c
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_074927-rwm1qqvr/run-rwm1qqvr.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..647a25fa35e7f4d83751b04bc20e3143af078eba
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/config.yaml
@@ -0,0 +1,615 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ 89offtg18nkl0daugw7ob6ogc3vo0r47:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "50870067200"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x51514ecc6ede157"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf3ef7b4642ab85b4"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x7f3568312f929f55"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x78c4870668ca6f3c"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa5b5be8f3bb8ee59"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xd7645877fbcaeda9"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x29dc055d2883ffc3"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa98ff96823c37f37"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-310
+ memory:
+ total: "2434606936064"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758959956"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1619"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-310
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758700756"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1619"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-310
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "1391516"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-310
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T07:59:56.864946Z"
+ writerId: 89offtg18nkl0daugw7ob6ogc3vo0r47
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 2
+ - 13
+ - 15
+ - 16
+ - 61
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "10":
+ - 19
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_075928
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..2b44baecad2a51d83ba2a4633cd2b77fa06e49e9
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/output.log
@@ -0,0 +1,78 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [07:59:58] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [08:00:00] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [08:00:01] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [08:00:03] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.6._fsdp_wrapped_module.att_proj.parametrizations.weight.0.lora_A
+************* After get lora params successfully
+09/24 [08:01:23] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+09/24 [08:01:24] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+!!!Training failed: AffordVLA.forward() got an unexpected keyword argument 'train_exit_random_layer'
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main
+ trainer.fit()
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2324, in fit
+ metrics = self.train_step(batch, reduce_global_loss=should_log_this_step)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2031, in train_step
+ ce_batch_loss, z_batch_loss, batch_accuracy, lb_batch_loss, moe_z_batch_loss, expert_assignments,action_loss = self.train_batch(batch)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1949, in train_batch
+ accuracy, ce_loss, z_loss, logits, action_loss = self.model_forward(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1806, in model_forward
+ outputs = self.fsdp_model.forward(
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py", line 854, in forward
+ output = self._fsdp_wrapped_module(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl
+ return self._call_impl(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl
+ return forward_call(*args, **kwargs)
+TypeError: AffordVLA.forward() got an unexpected keyword argument 'train_exit_random_layer'
+wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..585cfd9d266f36ef26e125702bdc7d2c223c5d02
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T07:59:56.864946Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-310",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50870067200"
+ }
+ },
+ "memory": {
+ "total": "2434606936064"
+ },
+ "gpu_amd": [
+ {
+ "id": "1",
+ "uniqueId": "0x51514ecc6ede157",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0xf3ef7b4642ab85b4",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x7f3568312f929f55",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x78c4870668ca6f3c",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xa5b5be8f3bb8ee59",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xd7645877fbcaeda9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x29dc055d2883ffc3",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xa98ff96823c37f37",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758959956",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1619",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-310",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758700756",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1619",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-310",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "1391516",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-310",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "89offtg18nkl0daugw7ob6ogc3vo0r47"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..684644a914dbe0209b573feb258e4a696257bec3
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/files/wandb-summary.json
@@ -0,0 +1 @@
+{"_wandb":{"runtime":86},"_runtime":86.714425509,"_timestamp":1.758700883602961e+09,"_step":0,"System/Peak GPU Memory (MB)":39071.62890625}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..56ea2ab49af0ee1a6ef62498c37f277f0230c30e
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-core.log
@@ -0,0 +1,16 @@
+{"time":"2025-09-24T07:59:56.919662705Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp91nqx5p7/port-1391594.txt","pid":1391594,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T07:59:56.920237123Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1391594}
+{"time":"2025-09-24T07:59:56.920198313Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1391594-1391765-820775743/socket","Net":"unix"}}
+{"time":"2025-09-24T07:59:57.103281705Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T07:59:57.10780315Z","level":"INFO","msg":"handleInformInit: received","streamId":"zoletkkn","id":"1(@)"}
+{"time":"2025-09-24T07:59:58.229681679Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"zoletkkn","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.309799558Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"zoletkkn","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313173037Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"zoletkkn","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313179117Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313185547Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313192187Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T08:01:27.313195627Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313238558Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313242268Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T08:01:27.313286108Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-1391594-1391765-820775743/socket","Net":"unix"}}
+{"time":"2025-09-24T08:01:27.313306649Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..63cc375efca17a8cd6c539a8dc96f58d582e86e1
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug-internal.log
@@ -0,0 +1,12 @@
+{"time":"2025-09-24T07:59:57.109651716Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T07:59:58.229629538Z","level":"INFO","msg":"stream: created new stream","id":"zoletkkn"}
+{"time":"2025-09-24T07:59:58.229676109Z","level":"INFO","msg":"stream: started","id":"zoletkkn"}
+{"time":"2025-09-24T07:59:58.229702239Z","level":"INFO","msg":"writer: started","stream_id":"zoletkkn"}
+{"time":"2025-09-24T07:59:58.229705689Z","level":"INFO","msg":"sender: started","stream_id":"zoletkkn"}
+{"time":"2025-09-24T07:59:58.22973716Z","level":"INFO","msg":"handler: started","stream_id":"zoletkkn"}
+{"time":"2025-09-24T08:01:25.265412834Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":1.650757548}],"total_operations":1}}
+{"time":"2025-09-24T08:01:26.944125764Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T08:01:27.310253075Z","level":"INFO","msg":"stream: closing","id":"zoletkkn"}
+{"time":"2025-09-24T08:01:27.310267105Z","level":"INFO","msg":"handler: closed","stream_id":"zoletkkn"}
+{"time":"2025-09-24T08:01:27.311384011Z","level":"INFO","msg":"sender: closed","stream_id":"zoletkkn"}
+{"time":"2025-09-24T08:01:27.311403191Z","level":"INFO","msg":"stream: closed","id":"zoletkkn"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/run-zoletkkn.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/run-zoletkkn.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..5679244afe90564c5dd8f6fb347b04ff3235beaa
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_075956-zoletkkn/run-zoletkkn.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..54fd71106154088fba1ca92ba9fb84448bcb34c5
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/config.yaml
@@ -0,0 +1,615 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ jzx8si0l57xezb9k6ob0j3tnnhprupzb:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "768"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "50870210560"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa98ff96823c37f37"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x7f3568312f929f55"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf3ef7b4642ab85b4"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x78c4870668ca6f3c"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xd7645877fbcaeda9"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x29dc055d2883ffc3"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa5b5be8f3bb8ee59"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x51514ecc6ede157"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-310
+ memory:
+ total: "2434606936064"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758960307"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1620"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-310
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758701107"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1620"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-310
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "1393644"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-310
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T08:05:45.097162Z"
+ writerId: jzx8si0l57xezb9k6ob0j3tnnhprupzb
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 2
+ - 13
+ - 15
+ - 16
+ - 61
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "10":
+ - 19
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 768
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 768
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_080517
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..404c02c62817281bdd00bd7898725e59dc370d2b
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/output.log
@@ -0,0 +1,80 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [08:05:47] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [08:05:49] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [08:05:51] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.9._fsdp_wrapped_module.att_proj.parametrizations.weight.0.lora_A
+************* After get lora params successfully
+09/24 [08:07:09] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+09/24 [08:07:10] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+!!!Training failed: index 963 is out of bounds for dimension 1 with size 768
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main
+ trainer.fit()
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2324, in fit
+ metrics = self.train_step(batch, reduce_global_loss=should_log_this_step)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2031, in train_step
+ ce_batch_loss, z_batch_loss, batch_accuracy, lb_batch_loss, moe_z_batch_loss, expert_assignments,action_loss = self.train_batch(batch)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1949, in train_batch
+ accuracy, ce_loss, z_loss, logits, action_loss = self.model_forward(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1806, in model_forward
+ outputs = self.fsdp_model.forward(
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py", line 854, in forward
+ output = self._fsdp_wrapped_module(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl
+ return self._call_impl(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl
+ return forward_call(*args, **kwargs)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/vla/affordvla.py", line 817, in forward
+ x[:,proprio_token_idx[0],:] = proprio_features.squeeze()
+IndexError: index 963 is out of bounds for dimension 1 with size 768
+wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..bf2f8ae0aab89608c65d3b4f09eed869918ed388
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T08:05:45.097162Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "768",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-310",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50870210560"
+ }
+ },
+ "memory": {
+ "total": "2434606936064"
+ },
+ "gpu_amd": [
+ {
+ "id": "7",
+ "uniqueId": "0xa98ff96823c37f37",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x7f3568312f929f55",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0xf3ef7b4642ab85b4",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x78c4870668ca6f3c",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xd7645877fbcaeda9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x29dc055d2883ffc3",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xa5b5be8f3bb8ee59",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x51514ecc6ede157",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758960307",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1620",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-310",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758701107",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1620",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-310",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "1393644",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-310",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "jzx8si0l57xezb9k6ob0j3tnnhprupzb"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..5358d14f0b0e343741eb247ba2b2523f7de1dc99
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/files/wandb-summary.json
@@ -0,0 +1 @@
+{"System/Peak GPU Memory (MB)":39071.62890625,"_wandb":{"runtime":84},"_runtime":84.515978221,"_timestamp":1.758701229397748e+09,"_step":0}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..82b998f8bf6aa70fadc6a91cebb03487ddb26451
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-core.log
@@ -0,0 +1,16 @@
+{"time":"2025-09-24T08:05:45.147407358Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp8yo_j3ql/port-1393722.txt","pid":1393722,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T08:05:45.148011766Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1393722}
+{"time":"2025-09-24T08:05:45.147993566Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1393722-1393887-36962336/socket","Net":"unix"}}
+{"time":"2025-09-24T08:05:45.331440004Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T08:05:45.338336553Z","level":"INFO","msg":"handleInformInit: received","streamId":"o2pw3uj2","id":"1(@)"}
+{"time":"2025-09-24T08:05:46.532294827Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"o2pw3uj2","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.614685833Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"o2pw3uj2","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618199374Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"o2pw3uj2","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618205734Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618214184Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618221274Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618231334Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T08:07:13.618245635Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618283025Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T08:07:13.618417467Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-1393722-1393887-36962336/socket","Net":"unix"}}
+{"time":"2025-09-24T08:07:13.618454238Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..c429b098c580a75c25caffe7b2bbe383772a5c70
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug-internal.log
@@ -0,0 +1,12 @@
+{"time":"2025-09-24T08:05:45.340327622Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T08:05:46.532247566Z","level":"INFO","msg":"stream: created new stream","id":"o2pw3uj2"}
+{"time":"2025-09-24T08:05:46.532289117Z","level":"INFO","msg":"stream: started","id":"o2pw3uj2"}
+{"time":"2025-09-24T08:05:46.532308677Z","level":"INFO","msg":"writer: started","stream_id":"o2pw3uj2"}
+{"time":"2025-09-24T08:05:46.532315867Z","level":"INFO","msg":"handler: started","stream_id":"o2pw3uj2"}
+{"time":"2025-09-24T08:05:46.532345608Z","level":"INFO","msg":"sender: started","stream_id":"o2pw3uj2"}
+{"time":"2025-09-24T08:07:11.483037395Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":2.084611044}],"total_operations":1}}
+{"time":"2025-09-24T08:07:13.15779756Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T08:07:13.615091449Z","level":"INFO","msg":"stream: closing","id":"o2pw3uj2"}
+{"time":"2025-09-24T08:07:13.615103709Z","level":"INFO","msg":"handler: closed","stream_id":"o2pw3uj2"}
+{"time":"2025-09-24T08:07:13.616414408Z","level":"INFO","msg":"sender: closed","stream_id":"o2pw3uj2"}
+{"time":"2025-09-24T08:07:13.616431988Z","level":"INFO","msg":"stream: closed","id":"o2pw3uj2"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/run-o2pw3uj2.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/run-o2pw3uj2.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..82ce3ba0714fd479f6a954fff68b1cb7e379dd70
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_080545-o2pw3uj2/run-o2pw3uj2.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/config.yaml b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..39879d24015c036bf611c11e126a92377bfd3316
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/config.yaml
@@ -0,0 +1,615 @@
+_wandb:
+ value:
+ cli_version: 0.21.4
+ e:
+ 71773rlly0etrjwxrtco2c8pzrqnc7wl:
+ args:
+ - qwen2_7b
+ - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+ - --vision_backbone
+ - openai
+ - --action_head
+ - flow_matching
+ - --seq_len
+ - "1024"
+ - --lora_rank
+ - "32"
+ - --lora_llm
+ - --checkpoint
+ - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+ - --device_train_microbatch_size
+ - "22"
+ - --global_batch_size
+ - "176"
+ - --dataset
+ - vla_dataset_realworld
+ - --llm_learning_rate
+ - "5e-5"
+ - --wandb_entity
+ - henryeap
+ - --wandb_project
+ - a1-realworld
+ - --wandb_run_name
+ - glue
+ - --save_overwrite
+ codePath: launch_scripts/train_vla.py
+ codePathLocal: launch_scripts/train_vla.py
+ cpu_count: 64
+ cpu_count_logical: 128
+ disk:
+ /:
+ total: "470343073792"
+ used: "50870362112"
+ email: ihenrykwok@outlook.com
+ executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10
+ git:
+ commit: c13f2763af61e0d729a8b5ab4bdefc512205bcc5
+ remote: https://github.com/Spatialtemporal-AI/A1.git
+ gpu: Instinct MI210
+ gpu_amd:
+ - id: "0"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x7f3568312f929f55"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "7"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa98ff96823c37f37"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "5"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x29dc055d2883ffc3"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "4"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xd7645877fbcaeda9"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "2"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xf3ef7b4642ab85b4"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "6"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0xa5b5be8f3bb8ee59"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "1"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x51514ecc6ede157"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ - id: "3"
+ maxPower: "300.0"
+ mclkRange: 400Mhz - 1600Mhz
+ model: "0x740f"
+ performanceLevel: auto
+ sclkRange: 500Mhz - 1700Mhz
+ series: Instinct MI210
+ sku: D67301V
+ uniqueId: "0x78c4870668ca6f3c"
+ vbiosVersion: 113-D67301V-073
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
+ gpu_count: 8
+ host: auh7-1b-gpu-310
+ memory:
+ total: "2434606936064"
+ os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35
+ program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py
+ python: CPython 3.10.18
+ root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb
+ slurm:
+ cluster_name: ai-04r
+ conf: /etc/slurm/slurm.conf
+ cpus_on_node: "128"
+ gpus_on_node: "8"
+ gtids: "0"
+ job_account: faculty-acc
+ job_cpus_per_node: "128"
+ job_end_time: "1758960687"
+ job_gid: "2000"
+ job_gpus: 0,1,2,3,4,5,6,7
+ job_id: "1621"
+ job_name: realworld_mh
+ job_nodelist: auh7-1b-gpu-310
+ job_num_nodes: "1"
+ job_partition: faculty
+ job_qos: xdqos
+ job_start_time: "1758701487"
+ job_uid: "2013"
+ job_user: xiaodan
+ jobid: "1621"
+ localid: "0"
+ nnodes: "1"
+ nodeid: "0"
+ nodelist: auh7-1b-gpu-310
+ nprocs: "1"
+ ntasks: "1"
+ ntasks_per_node: "1"
+ oom_kill_step: "0"
+ prio_process: "0"
+ procid: "0"
+ submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts
+ submit_host: auh-1b-cpu-login-001
+ task_pid: "1395749"
+ tasks_per_node: "1"
+ topology_addr: auh7-1b-gpu-310
+ topology_addr_pattern: node
+ startedAt: "2025-09-24T08:12:05.038967Z"
+ writerId: 71773rlly0etrjwxrtco2c8pzrqnc7wl
+ m: []
+ python_version: 3.10.18
+ t:
+ "1":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "2":
+ - 1
+ - 3
+ - 5
+ - 11
+ - 41
+ - 49
+ - 51
+ - 53
+ - 63
+ - 71
+ - 83
+ - 95
+ - 105
+ "3":
+ - 2
+ - 13
+ - 15
+ - 16
+ - 61
+ "4": 3.10.18
+ "5": 0.21.4
+ "6": 4.56.1
+ "10":
+ - 19
+ "12": 0.21.4
+ "13": linux-x86_64
+activation_checkpointing:
+ value: whole_layer
+allow_resume:
+ value: false
+batch_divisor:
+ value: global_batch
+canceled_check_interval:
+ value: 50
+checkpoint_dir:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+compile:
+ value: null
+console_log_interval:
+ value: 1
+data:
+ value:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: null
+ lerobot_episode_index_start: null
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: false
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: 95818
+ sequence_length: 1024
+ shuffle: true
+ shuffle_messages: false
+ split: train
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+device_eval_batch_size:
+ value: 4
+device_inf_eval_batch_size:
+ value: 16
+device_train_batch_size:
+ value: 22
+device_train_grad_accum:
+ value: 1
+device_train_microbatch_size:
+ value: 22
+dry_run:
+ value: false
+early_exit:
+ value: false
+epoch:
+ value: null
+eval_interval:
+ value: 0
+eval_on_load:
+ value: false
+eval_subset_num_batches:
+ value: -1
+evaluators:
+ value:
+ - data:
+ dataset: vla_dataset_realworld
+ drop_last: true
+ for_inference: false
+ lerobot_episode_index_end: 765
+ lerobot_episode_index_start: 353
+ mixture: null
+ multi_modal: torch
+ num_workers: 0
+ pad: to_max
+ persistent_workers: true
+ pin_memory: true
+ prefetch_factor: null
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_read_threads: 8
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ root_size_mixture: null
+ seed: null
+ sequence_length: 1024
+ shuffle: false
+ shuffle_messages: false
+ split: validation
+ timeout: 0
+ use_proprio: true
+ use_wrist_image: true
+ device_eval_batch_size: null
+ eval_name: null
+ label: val
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ skip_if_metrics_cached: true
+ subset_num_batches: 64
+extra_steps_after_cancel:
+ value: 10
+fast_forward_batches:
+ value: null
+force_save_unsharded:
+ value: false
+fsdp:
+ value:
+ hybrid_sharding_num_model_replicas: null
+ precision: float
+ sharding_strategy: FULL_SHARD
+ use_orig_params: true
+ wrapping_strategy: by_block_and_size
+ft_connector:
+ value: false
+ft_embedding:
+ value: lm_head
+ft_llm:
+ value: false
+ft_vit:
+ value: false
+fused_loss:
+ value: null
+gen1_gc_interval:
+ value: 1
+global_train_batch_size:
+ value: 176
+inf_eval_interval:
+ value: -1
+inf_eval_subset_num_batches:
+ value: -1
+inf_evaluators:
+ value: []
+initial_model_checkpoint:
+ value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+keep_lr_on_load:
+ value: true
+load_model_config:
+ value: null
+load_path:
+ value: null
+load_path_sharded_checkpointer:
+ value: null
+lora:
+ value: false
+lora_connector:
+ value: false
+lora_llm:
+ value: true
+lora_rank:
+ value: 32
+lora_vit:
+ value: false
+max_duration:
+ value: 500000
+max_grad_norm:
+ value: 1
+max_grad_norm_ratio:
+ value: null
+model:
+ value:
+ action_head: flow_matching
+ action_head_dit_depth: 28
+ action_head_dit_hidden_size: 1152
+ action_head_dit_num_heads: 16
+ action_use_left_eef: false
+ action_use_mobile_base: false
+ activation_type: swiglu
+ additional_vocab_size: 128
+ always_start_with_space: true
+ attention_dropout: 0
+ attention_layer_norm: false
+ attention_layer_norm_with_affine: true
+ attention_type: sdpa
+ bias_for_layer_norm: null
+ block_group_size: 1
+ block_type: sequential
+ clip_qkv: null
+ crop_mode: overlap-and-resize-c2
+ d_model: 3584
+ default_inference_len: 65
+ embedding_dropout: 0
+ embedding_size: 152064
+ fix_image_padding: true
+ float32_attention: true
+ head_dim: null
+ image_feature_dropout: 0
+ image_padding_embed: pad_and_partial_pad
+ image_pooling_2d: attention_meanq
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_projector: mlp
+ include_bias: false
+ init_cutoff_factor: null
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ initializer_range: 0.02
+ layer_norm_eps: 1e-06
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ llm_causal_attention: false
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ max_crops: 12
+ max_position_embeddings: null
+ max_sequence_length: 4096
+ message_formatting: role
+ mlp_hidden_size: 37888
+ mlp_ratio: 4
+ moe_capacity_factor: 1.25
+ moe_dropless: true
+ moe_interleave: false
+ moe_lbl_in_fp32: false
+ moe_log_expert_assignment: false
+ moe_loss_weight: 0.1
+ moe_mlp_impl: sparse
+ moe_num_experts: 8
+ moe_shared_expert: false
+ moe_top_k: 2
+ moe_zloss_weight: null
+ multi_annotation_weighting: root_subsegments
+ n_heads: 28
+ n_kv_heads: 4
+ n_layers: 28
+ new_embedding_init_range: 0.02
+ norm_after: false
+ normalize_input_embeds: false
+ num_diffusion_inference_steps: 30
+ num_diffusion_steps: 1000
+ overlap_margins:
+ - 4
+ - 4
+ pad_tokenizer: true
+ pad_value: 0
+ precision: amp_bf16
+ prompt_type: uber_model
+ qkv_bias: true
+ residual_dropout: 0.1
+ response_residual_dropout: 0
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1e+06
+ scale_logits: false
+ system_prompt_kind: demo_or_style
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ use_col_tokens: true
+ use_position_ids: true
+ use_proprio: true
+ vision_backbone:
+ attention_dropout: 0
+ fsdp_wrap: false
+ image_default_input_size:
+ - 336
+ - 336
+ image_dropout_rate: 0
+ image_emb_dim: 1024
+ image_head_dim: 64
+ image_mlp_activations: quick_gelu
+ image_mlp_dim: 4096
+ image_model_type: openai
+ image_norm_eps: 1e-05
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_num_pos: 577
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ initializer_range: 0.02
+ residual_dropout: 0
+ resize_mode: default
+ vit_layers:
+ - -2
+ - -9
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ vocab_size: 152064
+ weight_tying: false
+multi_component_grad_norm:
+ value: true
+no_pre_train_checkpoint:
+ value: true
+optimizer:
+ value:
+ betas:
+ - 0.9
+ - 0.95
+ connector_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1e-06
+ connector_learning_rate: 0.0002
+ connector_weight_decay: 0
+ eps: 1e-05
+ learning_rate: 0.0001
+ llm_betas:
+ - 0.9
+ - 0.95
+ llm_eps: 1e-06
+ llm_learning_rate: 5e-05
+ llm_weight_decay: 0
+ metrics_log_interval: 20
+ name: adamw
+ vit_betas:
+ - 0.9
+ - 0.95
+ vit_eps: 1e-06
+ vit_learning_rate: 6e-06
+ vit_weight_decay: 0
+ weight_decay: 0.01
+precision:
+ value: amp_bf16
+python_profiling:
+ value: false
+remote_save_folder:
+ value: null
+reset_dataloader_state:
+ value: false
+reset_optimizer_state:
+ value: false
+reset_trainer_state:
+ value: false
+restore_dataloader:
+ value: true
+run_name:
+ value: glue_20250924_081136
+save_dataloader_state:
+ value: false
+save_folder:
+ value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt
+save_interval:
+ value: 500
+save_interval_action_head:
+ value: 500
+save_interval_ephemeral:
+ value: null
+save_interval_unsharded:
+ value: 500
+save_num_action_head_checkpoints_to_keep:
+ value: 2
+save_num_checkpoints_to_keep:
+ value: 1
+save_num_unsharded_checkpoints_to_keep:
+ value: 1
+save_overwrite:
+ value: true
+scheduler:
+ value:
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ grad_clip_warmup_factor: null
+ grad_clip_warmup_steps: null
+ llm_t_warmup: 2000
+ name: multimodal
+ t_max: null
+ t_warmup: 100
+ units: steps
+ vit_t_warmup: 2000
+ warmup_min_lr: 0
+seed:
+ value: 6198
+sharded_checkpointer:
+ value: torch_legacy
+softmax_auxiliary_loss:
+ value: true
+softmax_auxiliary_loss_scale:
+ value: 0.0001
+speed_monitor:
+ value:
+ gpu_flops_available: null
+ window_size: 20
+stop_after:
+ value: null
+stop_at:
+ value: 500000
+time_limit:
+ value: null
+torch_profiling:
+ value: false
+train_exit_random_layer:
+ value: false
+use_lora:
+ value: true
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..c623e2980bb26c521f7e84ab7645a844ae0b67e8
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/output.log
@@ -0,0 +1,82 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [08:12:07] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [08:12:08] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [08:12:09] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [08:12:11] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.10._fsdp_wrapped_module.attn_out.parametrizations.weight.0.lora_B
+************* After get lora params successfully
+09/24 [08:13:28] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+09/24 [08:13:29] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+!!!Training failed: Action start pos 965 and end positions -1 must be valid indices in the input sequence
+Traceback (most recent call last):
+ File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main
+ trainer.fit()
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2324, in fit
+ metrics = self.train_step(batch, reduce_global_loss=should_log_this_step)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2031, in train_step
+ ce_batch_loss, z_batch_loss, batch_accuracy, lb_batch_loss, moe_z_batch_loss, expert_assignments,action_loss = self.train_batch(batch)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1949, in train_batch
+ accuracy, ce_loss, z_loss, logits, action_loss = self.model_forward(
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 1806, in model_forward
+ outputs = self.fsdp_model.forward(
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py", line 854, in forward
+ output = self._fsdp_wrapped_module(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl
+ return self._call_impl(*args, **kwargs)
+ File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl
+ return forward_call(*args, **kwargs)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/vla/affordvla.py", line 1039, in forward
+ action_hidden_states = self.extract_action_hidden_states(last_hidden_state, input_ids)
+ File "/vast/users/xiaodan/zhangjian/A1/olmo/vla/affordvla.py", line 282, in extract_action_hidden_states
+ assert end_idx>0 and start_idx>=0, f"Action start pos {start_idx} and end positions {end_idx} must be valid indices in the input sequence"
+AssertionError: Action start pos 965 and end positions -1 must be valid indices in the input sequence
+wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..a1cf96214fb20e98a44f44a9fbc416ede9767ae4
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T08:12:05.038967Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1024",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-310",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50870362112"
+ }
+ },
+ "memory": {
+ "total": "2434606936064"
+ },
+ "gpu_amd": [
+ {
+ "id": "0",
+ "uniqueId": "0x7f3568312f929f55",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xa98ff96823c37f37",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x29dc055d2883ffc3",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xd7645877fbcaeda9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0xf3ef7b4642ab85b4",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xa5b5be8f3bb8ee59",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x51514ecc6ede157",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x78c4870668ca6f3c",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758960687",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1621",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-310",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758701487",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1621",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-310",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "1395749",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-310",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "71773rlly0etrjwxrtco2c8pzrqnc7wl"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-summary.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-summary.json
new file mode 100644
index 0000000000000000000000000000000000000000..0218d9fe3949091450ed8b0bfdd899138b035cfb
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/files/wandb-summary.json
@@ -0,0 +1 @@
+{"System/Peak GPU Memory (MB)":39071.62890625,"_timestamp":1.758701608529476e+09,"_step":0,"_wandb":{"runtime":90},"_runtime":90.244994632}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..1cb37f2a27c84302b237509c9ca67473f96dbbd8
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-core.log
@@ -0,0 +1,16 @@
+{"time":"2025-09-24T08:12:05.089914727Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpv0416bdr/port-1395827.txt","pid":1395827,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T08:12:05.090327263Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1395827}
+{"time":"2025-09-24T08:12:05.090314043Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1395827-1396213-2359412859/socket","Net":"unix"}}
+{"time":"2025-09-24T08:12:05.274415601Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T08:12:05.281627106Z","level":"INFO","msg":"handleInformInit: received","streamId":"s84jc1wj","id":"1(@)"}
+{"time":"2025-09-24T08:12:06.403399953Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"s84jc1wj","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.840845915Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"s84jc1wj","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844156043Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"s84jc1wj","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844160353Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844165893Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844171833Z","level":"INFO","msg":"server is shutting down"}
+{"time":"2025-09-24T08:13:38.844170943Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844197873Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844201153Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
+{"time":"2025-09-24T08:13:38.844239534Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-1395827-1396213-2359412859/socket","Net":"unix"}}
+{"time":"2025-09-24T08:13:38.844257354Z","level":"INFO","msg":"server is closed"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..ff81c6e8a65a487d7864e6a579022583f72be7c9
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug-internal.log
@@ -0,0 +1,12 @@
+{"time":"2025-09-24T08:12:05.283670566Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T08:12:06.403354463Z","level":"INFO","msg":"stream: created new stream","id":"s84jc1wj"}
+{"time":"2025-09-24T08:12:06.403394923Z","level":"INFO","msg":"stream: started","id":"s84jc1wj"}
+{"time":"2025-09-24T08:12:06.403399293Z","level":"INFO","msg":"handler: started","stream_id":"s84jc1wj"}
+{"time":"2025-09-24T08:12:06.403404383Z","level":"INFO","msg":"sender: started","stream_id":"s84jc1wj"}
+{"time":"2025-09-24T08:12:06.403423244Z","level":"INFO","msg":"writer: started","stream_id":"s84jc1wj"}
+{"time":"2025-09-24T08:13:37.504606863Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"uploading console lines 35-80","runtime_seconds":0.220497353},{"desc":"updating run metadata","runtime_seconds":0.177773298}],"total_operations":2}}
+{"time":"2025-09-24T08:13:38.49640708Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+{"time":"2025-09-24T08:13:38.84121277Z","level":"INFO","msg":"stream: closing","id":"s84jc1wj"}
+{"time":"2025-09-24T08:13:38.84122466Z","level":"INFO","msg":"handler: closed","stream_id":"s84jc1wj"}
+{"time":"2025-09-24T08:13:38.84257624Z","level":"INFO","msg":"sender: closed","stream_id":"s84jc1wj"}
+{"time":"2025-09-24T08:13:38.84258484Z","level":"INFO","msg":"stream: closed","id":"s84jc1wj"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/run-s84jc1wj.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/run-s84jc1wj.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..4f937a466b22d3e156b9c5be8bddabec1b69c676
Binary files /dev/null and b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081205-s84jc1wj/run-s84jc1wj.wandb differ
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..0409a943dac334e8ac14f210b3ef3224edb873ee
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/output.log
@@ -0,0 +1,66 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [08:17:25] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [08:17:26] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/24 [08:17:27] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [08:17:29] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.17._fsdp_wrapped_module.ff_out.parametrizations.weight.0.lora_A
+************* After get lora params successfully
+09/24 [08:18:47] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+ WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+09/24 [08:18:58] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+!!!Training failed: NCCL communicator was aborted on rank 0.
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..aeee136d9db367d7dd23bb999ad32e1f6da0434e
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T08:17:23.081896Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "22",
+ "--global_batch_size",
+ "176",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-310",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50870501376"
+ }
+ },
+ "memory": {
+ "total": "2434606936064"
+ },
+ "gpu_amd": [
+ {
+ "id": "1",
+ "uniqueId": "0x51514ecc6ede157",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x78c4870668ca6f3c",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xa98ff96823c37f37",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xd7645877fbcaeda9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0xf3ef7b4642ab85b4",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xa5b5be8f3bb8ee59",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x7f3568312f929f55",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x29dc055d2883ffc3",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758961004",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1622",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-310",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758701804",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1622",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-310",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "1398012",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-310",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "j2b8i27td0wcxqgodk1fx9zhxbxnu6k4"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..181ee22be6b267ecb93d039bd9cee52db929f632
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-core.log
@@ -0,0 +1,7 @@
+{"time":"2025-09-24T08:17:23.133965584Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpx6ifjex2/port-1398166.txt","pid":1398166,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T08:17:23.134463341Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1398166}
+{"time":"2025-09-24T08:17:23.134454481Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1398166-1398334-1389690679/socket","Net":"unix"}}
+{"time":"2025-09-24T08:17:23.317462701Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T08:17:23.324378323Z","level":"INFO","msg":"handleInformInit: received","streamId":"x94cyrsz","id":"1(@)"}
+{"time":"2025-09-24T08:17:24.467120592Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"x94cyrsz","id":"1(@)"}
+{"time":"2025-09-24T08:30:05.177516323Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..cf5a1525220aa808cfa90f72069feb46b52fb122
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-09-24T08:17:23.326318231Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T08:17:24.467070131Z","level":"INFO","msg":"stream: created new stream","id":"x94cyrsz"}
+{"time":"2025-09-24T08:17:24.467115362Z","level":"INFO","msg":"stream: started","id":"x94cyrsz"}
+{"time":"2025-09-24T08:17:24.467134242Z","level":"INFO","msg":"writer: started","stream_id":"x94cyrsz"}
+{"time":"2025-09-24T08:17:24.467160842Z","level":"INFO","msg":"handler: started","stream_id":"x94cyrsz"}
+{"time":"2025-09-24T08:17:24.467181922Z","level":"INFO","msg":"sender: started","stream_id":"x94cyrsz"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/run-x94cyrsz.wandb b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/run-x94cyrsz.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..6b418b12f9f8b27dbb9363859bf2bdbdf7df8bdc
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_081723-x94cyrsz/run-x94cyrsz.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1360a8680aa88b649f2afe6311355b0142408cd109faaf70fe75674abe89fd73
+size 131072
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/output.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..968657c2dd580c173cbdcff61ed90dd3f8d65b7c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/output.log
@@ -0,0 +1,61931 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/24 [08:24:18] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best', 0.6, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.4, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/24 [08:24:20] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/a1/Lerobot_Glue_best
+****** length of the dataset: 17698
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/24 [08:24:22] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.7._fsdp_wrapped_module.ff_proj.parametrizations.weight.0.lora_A
+************* After get lora params successfully
+09/24 [08:25:55] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+09/24 [08:25:56] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+09/24 [08:26:04] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.569
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=43,837
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.582
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=44,437
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.702
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.503
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.557
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.514
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.491
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=8/500000]
+ train/ActionNoiseL2Loss=1.476
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=9/500000]
+ train/ActionNoiseL2Loss=1.444
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=10/500000]
+ train/ActionNoiseL2Loss=1.495
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,437
+[step=11/500000]
+ train/ActionNoiseL2Loss=1.482
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=12/500000]
+ train/ActionNoiseL2Loss=1.406
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=13/500000]
+ train/ActionNoiseL2Loss=1.422
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=14/500000]
+ train/ActionNoiseL2Loss=1.368
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=15/500000]
+ train/ActionNoiseL2Loss=1.415
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=16/500000]
+ train/ActionNoiseL2Loss=1.391
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=17/500000]
+ train/ActionNoiseL2Loss=1.281
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=18/500000]
+ train/ActionNoiseL2Loss=1.238
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=19/500000]
+ train/ActionNoiseL2Loss=1.270
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=20/500000]
+ optim/total_grad_norm=15.14
+ train/ActionNoiseL2Loss=1.260
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,437
+[step=21/500000]
+ train/ActionNoiseL2Loss=1.309
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=22/500000]
+ train/ActionNoiseL2Loss=1.268
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=23/500000]
+ train/ActionNoiseL2Loss=1.275
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=24/500000]
+ train/ActionNoiseL2Loss=1.223
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=25/500000]
+ train/ActionNoiseL2Loss=1.273
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=26/500000]
+ train/ActionNoiseL2Loss=1.177
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=27/500000]
+ train/ActionNoiseL2Loss=1.196
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=28/500000]
+ train/ActionNoiseL2Loss=1.231
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=29/500000]
+ train/ActionNoiseL2Loss=1.176
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=30/500000]
+ train/ActionNoiseL2Loss=1.144
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=31/500000]
+ train/ActionNoiseL2Loss=1.082
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=32/500000]
+ train/ActionNoiseL2Loss=1.061
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=33/500000]
+ train/ActionNoiseL2Loss=1.082
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=34/500000]
+ train/ActionNoiseL2Loss=1.022
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=35/500000]
+ train/ActionNoiseL2Loss=0.9993
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=36/500000]
+ train/ActionNoiseL2Loss=1.103
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=37/500000]
+ train/ActionNoiseL2Loss=0.9701
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=38/500000]
+ train/ActionNoiseL2Loss=1.045
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=39/500000]
+ train/ActionNoiseL2Loss=1.206
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=40/500000]
+ optim/total_grad_norm=10.84
+ train/ActionNoiseL2Loss=0.9799
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=41/500000]
+ train/ActionNoiseL2Loss=0.9294
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=42/500000]
+ train/ActionNoiseL2Loss=0.9044
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=43/500000]
+ train/ActionNoiseL2Loss=1.082
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=44/500000]
+ train/ActionNoiseL2Loss=1.063
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=45/500000]
+ train/ActionNoiseL2Loss=1.033
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=46/500000]
+ train/ActionNoiseL2Loss=1.044
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=47/500000]
+ train/ActionNoiseL2Loss=1.008
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=48/500000]
+ train/ActionNoiseL2Loss=1.068
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=49/500000]
+ train/ActionNoiseL2Loss=1.043
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=50/500000]
+ train/ActionNoiseL2Loss=0.8276
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=51/500000]
+ train/ActionNoiseL2Loss=0.8855
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=52/500000]
+ train/ActionNoiseL2Loss=0.8058
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=53/500000]
+ train/ActionNoiseL2Loss=0.7920
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=54/500000]
+ train/ActionNoiseL2Loss=0.9990
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=55/500000]
+ train/ActionNoiseL2Loss=1.007
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=56/500000]
+ train/ActionNoiseL2Loss=0.8870
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=57/500000]
+ train/ActionNoiseL2Loss=0.7525
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=58/500000]
+ train/ActionNoiseL2Loss=0.7209
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=59/500000]
+ train/ActionNoiseL2Loss=0.7539
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=60/500000]
+ optim/total_grad_norm=10.70
+ train/ActionNoiseL2Loss=0.7880
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,437
+[step=61/500000]
+ train/ActionNoiseL2Loss=0.8949
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=62/500000]
+ train/ActionNoiseL2Loss=0.6930
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=63/500000]
+ train/ActionNoiseL2Loss=0.7788
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=64/500000]
+ train/ActionNoiseL2Loss=0.6957
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=65/500000]
+ train/ActionNoiseL2Loss=0.8098
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=66/500000]
+ train/ActionNoiseL2Loss=0.7080
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=67/500000]
+ train/ActionNoiseL2Loss=0.7430
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=68/500000]
+ train/ActionNoiseL2Loss=0.6479
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=69/500000]
+ train/ActionNoiseL2Loss=0.6914
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=70/500000]
+ train/ActionNoiseL2Loss=0.6274
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=71/500000]
+ train/ActionNoiseL2Loss=0.6927
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=72/500000]
+ train/ActionNoiseL2Loss=0.7260
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=73/500000]
+ train/ActionNoiseL2Loss=0.6665
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=74/500000]
+ train/ActionNoiseL2Loss=0.6069
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=75/500000]
+ train/ActionNoiseL2Loss=0.6036
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=76/500000]
+ train/ActionNoiseL2Loss=0.6710
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=77/500000]
+ train/ActionNoiseL2Loss=0.6308
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=78/500000]
+ train/ActionNoiseL2Loss=0.5842
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=79/500000]
+ train/ActionNoiseL2Loss=0.6715
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=80/500000]
+ optim/total_grad_norm=8.614
+ train/ActionNoiseL2Loss=0.5620
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=81/500000]
+ train/ActionNoiseL2Loss=0.7159
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=82/500000]
+ train/ActionNoiseL2Loss=0.5694
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=83/500000]
+ train/ActionNoiseL2Loss=0.7084
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=84/500000]
+ train/ActionNoiseL2Loss=0.6174
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=85/500000]
+ train/ActionNoiseL2Loss=0.7009
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=86/500000]
+ train/ActionNoiseL2Loss=0.6158
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=87/500000]
+ train/ActionNoiseL2Loss=0.5469
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=88/500000]
+ train/ActionNoiseL2Loss=0.6513
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=89/500000]
+ train/ActionNoiseL2Loss=0.6622
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=90/500000]
+ train/ActionNoiseL2Loss=0.5459
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=91/500000]
+ train/ActionNoiseL2Loss=0.5624
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=92/500000]
+ train/ActionNoiseL2Loss=0.5821
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=93/500000]
+ train/ActionNoiseL2Loss=0.5289
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=94/500000]
+ train/ActionNoiseL2Loss=0.5281
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=95/500000]
+ train/ActionNoiseL2Loss=0.4883
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=96/500000]
+ train/ActionNoiseL2Loss=0.6415
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=97/500000]
+ train/ActionNoiseL2Loss=0.5573
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=98/500000]
+ train/ActionNoiseL2Loss=0.6545
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=99/500000]
+ train/ActionNoiseL2Loss=0.6126
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=100/500000]
+ optim/total_grad_norm=13.69
+ train/ActionNoiseL2Loss=0.6471
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=101/500000]
+ train/ActionNoiseL2Loss=0.6327
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=102/500000]
+ train/ActionNoiseL2Loss=0.5801
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=103/500000]
+ train/ActionNoiseL2Loss=0.5606
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=104/500000]
+ train/ActionNoiseL2Loss=0.5618
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=105/500000]
+ train/ActionNoiseL2Loss=0.5412
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=106/500000]
+ train/ActionNoiseL2Loss=0.7053
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=107/500000]
+ train/ActionNoiseL2Loss=0.4865
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=108/500000]
+ train/ActionNoiseL2Loss=0.5624
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=109/500000]
+ train/ActionNoiseL2Loss=0.5282
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=110/500000]
+ train/ActionNoiseL2Loss=0.3917
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=111/500000]
+ train/ActionNoiseL2Loss=0.4262
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=112/500000]
+ train/ActionNoiseL2Loss=0.5530
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=113/500000]
+ train/ActionNoiseL2Loss=0.4333
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=114/500000]
+ train/ActionNoiseL2Loss=0.5370
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=115/500000]
+ train/ActionNoiseL2Loss=0.6218
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=116/500000]
+ train/ActionNoiseL2Loss=0.4263
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=117/500000]
+ train/ActionNoiseL2Loss=0.5854
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=118/500000]
+ train/ActionNoiseL2Loss=0.6948
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=119/500000]
+ train/ActionNoiseL2Loss=0.5762
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=120/500000]
+ optim/total_grad_norm=12.06
+ train/ActionNoiseL2Loss=0.5165
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=121/500000]
+ train/ActionNoiseL2Loss=0.5504
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=122/500000]
+ train/ActionNoiseL2Loss=0.5132
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=123/500000]
+ train/ActionNoiseL2Loss=0.5707
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=124/500000]
+ train/ActionNoiseL2Loss=0.5780
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=125/500000]
+ train/ActionNoiseL2Loss=0.5004
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=126/500000]
+ train/ActionNoiseL2Loss=0.5587
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=127/500000]
+ train/ActionNoiseL2Loss=0.5877
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=128/500000]
+ train/ActionNoiseL2Loss=0.6882
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=129/500000]
+ train/ActionNoiseL2Loss=0.5347
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=130/500000]
+ train/ActionNoiseL2Loss=0.5290
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=131/500000]
+ train/ActionNoiseL2Loss=0.5746
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=132/500000]
+ train/ActionNoiseL2Loss=0.4129
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=133/500000]
+ train/ActionNoiseL2Loss=0.6028
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=134/500000]
+ train/ActionNoiseL2Loss=0.5032
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=135/500000]
+ train/ActionNoiseL2Loss=0.5292
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=136/500000]
+ train/ActionNoiseL2Loss=0.6097
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=137/500000]
+ train/ActionNoiseL2Loss=0.5402
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=138/500000]
+ train/ActionNoiseL2Loss=0.6016
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=139/500000]
+ train/ActionNoiseL2Loss=0.4734
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=140/500000]
+ optim/total_grad_norm=10.38
+ train/ActionNoiseL2Loss=0.4516
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=141/500000]
+ train/ActionNoiseL2Loss=0.4594
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=142/500000]
+ train/ActionNoiseL2Loss=0.4584
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=143/500000]
+ train/ActionNoiseL2Loss=0.4533
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=144/500000]
+ train/ActionNoiseL2Loss=0.4657
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=145/500000]
+ train/ActionNoiseL2Loss=0.5507
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=146/500000]
+ train/ActionNoiseL2Loss=0.4442
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=147/500000]
+ train/ActionNoiseL2Loss=0.3964
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=148/500000]
+ train/ActionNoiseL2Loss=0.3630
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=149/500000]
+ train/ActionNoiseL2Loss=0.3701
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=150/500000]
+ train/ActionNoiseL2Loss=0.4735
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=151/500000]
+ train/ActionNoiseL2Loss=0.4492
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=152/500000]
+ train/ActionNoiseL2Loss=0.4994
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=153/500000]
+ train/ActionNoiseL2Loss=0.5274
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=154/500000]
+ train/ActionNoiseL2Loss=0.4801
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=155/500000]
+ train/ActionNoiseL2Loss=0.5265
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=156/500000]
+ train/ActionNoiseL2Loss=0.3136
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=157/500000]
+ train/ActionNoiseL2Loss=0.5350
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=158/500000]
+ train/ActionNoiseL2Loss=0.4568
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=159/500000]
+ train/ActionNoiseL2Loss=0.3060
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=160/500000]
+ optim/total_grad_norm=14.59
+ train/ActionNoiseL2Loss=0.5800
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=161/500000]
+ train/ActionNoiseL2Loss=0.5676
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=162/500000]
+ train/ActionNoiseL2Loss=0.5126
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=163/500000]
+ train/ActionNoiseL2Loss=0.4615
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=164/500000]
+ train/ActionNoiseL2Loss=0.5150
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=165/500000]
+ train/ActionNoiseL2Loss=0.4892
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=166/500000]
+ train/ActionNoiseL2Loss=0.4940
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=167/500000]
+ train/ActionNoiseL2Loss=0.3978
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=168/500000]
+ train/ActionNoiseL2Loss=0.5723
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=169/500000]
+ train/ActionNoiseL2Loss=0.4538
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=170/500000]
+ train/ActionNoiseL2Loss=0.5181
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=171/500000]
+ train/ActionNoiseL2Loss=0.4013
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=172/500000]
+ train/ActionNoiseL2Loss=0.3651
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=173/500000]
+ train/ActionNoiseL2Loss=0.3756
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=174/500000]
+ train/ActionNoiseL2Loss=0.3959
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=175/500000]
+ train/ActionNoiseL2Loss=0.4638
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=176/500000]
+ train/ActionNoiseL2Loss=0.3258
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=177/500000]
+ train/ActionNoiseL2Loss=0.5035
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=178/500000]
+ train/ActionNoiseL2Loss=0.6318
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=179/500000]
+ train/ActionNoiseL2Loss=0.4376
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=180/500000]
+ optim/total_grad_norm=12.53
+ train/ActionNoiseL2Loss=0.4790
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=181/500000]
+ train/ActionNoiseL2Loss=0.3576
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=182/500000]
+ train/ActionNoiseL2Loss=0.4612
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=183/500000]
+ train/ActionNoiseL2Loss=0.4910
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=184/500000]
+ train/ActionNoiseL2Loss=0.5728
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=185/500000]
+ train/ActionNoiseL2Loss=0.5238
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=186/500000]
+ train/ActionNoiseL2Loss=0.3720
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=187/500000]
+ train/ActionNoiseL2Loss=0.3488
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=188/500000]
+ train/ActionNoiseL2Loss=0.3491
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=189/500000]
+ train/ActionNoiseL2Loss=0.7017
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=190/500000]
+ train/ActionNoiseL2Loss=0.3530
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=191/500000]
+ train/ActionNoiseL2Loss=0.3894
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=192/500000]
+ train/ActionNoiseL2Loss=0.3983
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=193/500000]
+ train/ActionNoiseL2Loss=0.4406
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=194/500000]
+ train/ActionNoiseL2Loss=0.3711
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=195/500000]
+ train/ActionNoiseL2Loss=0.5858
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=196/500000]
+ train/ActionNoiseL2Loss=0.3708
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=197/500000]
+ train/ActionNoiseL2Loss=0.4106
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=198/500000]
+ train/ActionNoiseL2Loss=0.2970
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=199/500000]
+ train/ActionNoiseL2Loss=0.3415
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=200/500000]
+ optim/total_grad_norm=12.62
+ train/ActionNoiseL2Loss=0.5188
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=201/500000]
+ train/ActionNoiseL2Loss=0.4025
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=202/500000]
+ train/ActionNoiseL2Loss=0.4267
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=203/500000]
+ train/ActionNoiseL2Loss=0.3954
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=204/500000]
+ train/ActionNoiseL2Loss=0.3486
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=205/500000]
+ train/ActionNoiseL2Loss=0.2886
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=206/500000]
+ train/ActionNoiseL2Loss=0.2863
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=207/500000]
+ train/ActionNoiseL2Loss=0.5374
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=208/500000]
+ train/ActionNoiseL2Loss=0.4213
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=209/500000]
+ train/ActionNoiseL2Loss=0.3586
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=210/500000]
+ train/ActionNoiseL2Loss=0.3894
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=211/500000]
+ train/ActionNoiseL2Loss=0.4765
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=212/500000]
+ train/ActionNoiseL2Loss=0.2992
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=213/500000]
+ train/ActionNoiseL2Loss=0.4936
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=214/500000]
+ train/ActionNoiseL2Loss=0.4120
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=215/500000]
+ train/ActionNoiseL2Loss=0.4753
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=216/500000]
+ train/ActionNoiseL2Loss=0.5332
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=217/500000]
+ train/ActionNoiseL2Loss=0.4299
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=218/500000]
+ train/ActionNoiseL2Loss=0.4390
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=219/500000]
+ train/ActionNoiseL2Loss=0.3085
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=220/500000]
+ optim/total_grad_norm=13.00
+ train/ActionNoiseL2Loss=0.3470
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=221/500000]
+ train/ActionNoiseL2Loss=0.2923
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=222/500000]
+ train/ActionNoiseL2Loss=0.3682
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=223/500000]
+ train/ActionNoiseL2Loss=0.3666
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=224/500000]
+ train/ActionNoiseL2Loss=0.3445
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=225/500000]
+ train/ActionNoiseL2Loss=0.3867
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=226/500000]
+ train/ActionNoiseL2Loss=0.3650
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=227/500000]
+ train/ActionNoiseL2Loss=0.5095
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=228/500000]
+ train/ActionNoiseL2Loss=0.3884
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=229/500000]
+ train/ActionNoiseL2Loss=0.4709
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=230/500000]
+ train/ActionNoiseL2Loss=0.3686
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=231/500000]
+ train/ActionNoiseL2Loss=0.4406
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=232/500000]
+ train/ActionNoiseL2Loss=0.2809
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=233/500000]
+ train/ActionNoiseL2Loss=0.3434
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=234/500000]
+ train/ActionNoiseL2Loss=0.3986
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=235/500000]
+ train/ActionNoiseL2Loss=0.3462
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=236/500000]
+ train/ActionNoiseL2Loss=0.3549
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=237/500000]
+ train/ActionNoiseL2Loss=0.2596
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=238/500000]
+ train/ActionNoiseL2Loss=0.2900
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=239/500000]
+ train/ActionNoiseL2Loss=0.2246
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=240/500000]
+ optim/total_grad_norm=15.25
+ train/ActionNoiseL2Loss=0.3734
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=241/500000]
+ train/ActionNoiseL2Loss=0.4162
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=242/500000]
+ train/ActionNoiseL2Loss=0.3286
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=243/500000]
+ train/ActionNoiseL2Loss=0.3389
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=244/500000]
+ train/ActionNoiseL2Loss=0.2953
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=245/500000]
+ train/ActionNoiseL2Loss=0.2594
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=246/500000]
+ train/ActionNoiseL2Loss=0.3170
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=247/500000]
+ train/ActionNoiseL2Loss=0.4147
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=248/500000]
+ train/ActionNoiseL2Loss=0.3247
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=249/500000]
+ train/ActionNoiseL2Loss=0.3538
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=250/500000]
+ train/ActionNoiseL2Loss=0.2941
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=251/500000]
+ train/ActionNoiseL2Loss=0.3450
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=252/500000]
+ train/ActionNoiseL2Loss=0.2645
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=253/500000]
+ train/ActionNoiseL2Loss=0.2738
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=254/500000]
+ train/ActionNoiseL2Loss=0.3682
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=255/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=256/500000]
+ train/ActionNoiseL2Loss=0.3210
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=257/500000]
+ train/ActionNoiseL2Loss=0.2582
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=258/500000]
+ train/ActionNoiseL2Loss=0.2498
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=259/500000]
+ train/ActionNoiseL2Loss=0.3840
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=260/500000]
+ optim/total_grad_norm=14.26
+ train/ActionNoiseL2Loss=0.3413
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=261/500000]
+ train/ActionNoiseL2Loss=0.2522
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=262/500000]
+ train/ActionNoiseL2Loss=0.3285
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=263/500000]
+ train/ActionNoiseL2Loss=0.2454
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=264/500000]
+ train/ActionNoiseL2Loss=0.2964
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=265/500000]
+ train/ActionNoiseL2Loss=0.4043
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=266/500000]
+ train/ActionNoiseL2Loss=0.2258
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=267/500000]
+ train/ActionNoiseL2Loss=0.2664
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=268/500000]
+ train/ActionNoiseL2Loss=0.3579
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=269/500000]
+ train/ActionNoiseL2Loss=0.4528
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=270/500000]
+ train/ActionNoiseL2Loss=0.3439
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=271/500000]
+ train/ActionNoiseL2Loss=0.3625
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=272/500000]
+ train/ActionNoiseL2Loss=0.2663
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=273/500000]
+ train/ActionNoiseL2Loss=0.3743
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=274/500000]
+ train/ActionNoiseL2Loss=0.3549
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=275/500000]
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=276/500000]
+ train/ActionNoiseL2Loss=0.2599
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=277/500000]
+ train/ActionNoiseL2Loss=0.3468
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=278/500000]
+ train/ActionNoiseL2Loss=0.2363
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=279/500000]
+ train/ActionNoiseL2Loss=0.2895
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=280/500000]
+ optim/total_grad_norm=11.58
+ train/ActionNoiseL2Loss=0.2460
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=281/500000]
+ train/ActionNoiseL2Loss=0.2877
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=282/500000]
+ train/ActionNoiseL2Loss=0.3049
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=283/500000]
+ train/ActionNoiseL2Loss=0.2950
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=284/500000]
+ train/ActionNoiseL2Loss=0.3405
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=285/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=286/500000]
+ train/ActionNoiseL2Loss=0.3600
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=287/500000]
+ train/ActionNoiseL2Loss=0.2499
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=288/500000]
+ train/ActionNoiseL2Loss=0.3168
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=289/500000]
+ train/ActionNoiseL2Loss=0.3026
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=290/500000]
+ train/ActionNoiseL2Loss=0.2752
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=291/500000]
+ train/ActionNoiseL2Loss=0.2280
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=292/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=293/500000]
+ train/ActionNoiseL2Loss=0.2669
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=294/500000]
+ train/ActionNoiseL2Loss=0.1738
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=295/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=296/500000]
+ train/ActionNoiseL2Loss=0.2201
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=297/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=298/500000]
+ train/ActionNoiseL2Loss=0.3522
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=299/500000]
+ train/ActionNoiseL2Loss=0.2240
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=300/500000]
+ optim/total_grad_norm=12.18
+ train/ActionNoiseL2Loss=0.4209
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=301/500000]
+ train/ActionNoiseL2Loss=0.2282
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=302/500000]
+ train/ActionNoiseL2Loss=0.2457
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=303/500000]
+ train/ActionNoiseL2Loss=0.1539
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=304/500000]
+ train/ActionNoiseL2Loss=0.3161
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=305/500000]
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=306/500000]
+ train/ActionNoiseL2Loss=0.2568
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=307/500000]
+ train/ActionNoiseL2Loss=0.3128
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=308/500000]
+ train/ActionNoiseL2Loss=0.2548
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=309/500000]
+ train/ActionNoiseL2Loss=0.2677
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=310/500000]
+ train/ActionNoiseL2Loss=0.2691
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=311/500000]
+ train/ActionNoiseL2Loss=0.2493
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=312/500000]
+ train/ActionNoiseL2Loss=0.2451
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=313/500000]
+ train/ActionNoiseL2Loss=0.2843
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=314/500000]
+ train/ActionNoiseL2Loss=0.2751
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=315/500000]
+ train/ActionNoiseL2Loss=0.2292
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=316/500000]
+ train/ActionNoiseL2Loss=0.2332
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=317/500000]
+ train/ActionNoiseL2Loss=0.2436
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=318/500000]
+ train/ActionNoiseL2Loss=0.2528
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=319/500000]
+ train/ActionNoiseL2Loss=0.2377
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=320/500000]
+ optim/total_grad_norm=9.705
+ train/ActionNoiseL2Loss=0.2677
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=321/500000]
+ train/ActionNoiseL2Loss=0.2237
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=322/500000]
+ train/ActionNoiseL2Loss=0.3765
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=323/500000]
+ train/ActionNoiseL2Loss=0.2815
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=324/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=325/500000]
+ train/ActionNoiseL2Loss=0.3011
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=326/500000]
+ train/ActionNoiseL2Loss=0.2256
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=327/500000]
+ train/ActionNoiseL2Loss=0.3224
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=328/500000]
+ train/ActionNoiseL2Loss=0.1988
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=329/500000]
+ train/ActionNoiseL2Loss=0.2126
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=330/500000]
+ train/ActionNoiseL2Loss=0.3466
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=331/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=332/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=333/500000]
+ train/ActionNoiseL2Loss=0.2237
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=334/500000]
+ train/ActionNoiseL2Loss=0.2120
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=335/500000]
+ train/ActionNoiseL2Loss=0.2061
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=336/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=337/500000]
+ train/ActionNoiseL2Loss=0.3791
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=338/500000]
+ train/ActionNoiseL2Loss=0.3835
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=339/500000]
+ train/ActionNoiseL2Loss=0.3345
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=340/500000]
+ optim/total_grad_norm=7.915
+ train/ActionNoiseL2Loss=0.2232
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=341/500000]
+ train/ActionNoiseL2Loss=0.2668
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=342/500000]
+ train/ActionNoiseL2Loss=0.2778
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=343/500000]
+ train/ActionNoiseL2Loss=0.2526
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=344/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=345/500000]
+ train/ActionNoiseL2Loss=0.2164
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=346/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=347/500000]
+ train/ActionNoiseL2Loss=0.2007
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=348/500000]
+ train/ActionNoiseL2Loss=0.2074
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=349/500000]
+ train/ActionNoiseL2Loss=0.3083
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=350/500000]
+ train/ActionNoiseL2Loss=0.2392
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=351/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=352/500000]
+ train/ActionNoiseL2Loss=0.2084
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=353/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=354/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=355/500000]
+ train/ActionNoiseL2Loss=0.2380
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=356/500000]
+ train/ActionNoiseL2Loss=0.3129
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=357/500000]
+ train/ActionNoiseL2Loss=0.2432
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=358/500000]
+ train/ActionNoiseL2Loss=0.2682
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=359/500000]
+ train/ActionNoiseL2Loss=0.1431
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=360/500000]
+ optim/total_grad_norm=10.35
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=361/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=362/500000]
+ train/ActionNoiseL2Loss=0.2624
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=363/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=364/500000]
+ train/ActionNoiseL2Loss=0.2408
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=365/500000]
+ train/ActionNoiseL2Loss=0.2538
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=366/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=367/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=368/500000]
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=369/500000]
+ train/ActionNoiseL2Loss=0.2805
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=370/500000]
+ train/ActionNoiseL2Loss=0.1981
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=371/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=372/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=373/500000]
+ train/ActionNoiseL2Loss=0.2016
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=374/500000]
+ train/ActionNoiseL2Loss=0.2686
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=375/500000]
+ train/ActionNoiseL2Loss=0.1908
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=376/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=377/500000]
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=378/500000]
+ train/ActionNoiseL2Loss=0.2176
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=379/500000]
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=380/500000]
+ optim/total_grad_norm=9.630
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=381/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=382/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=383/500000]
+ train/ActionNoiseL2Loss=0.3487
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=384/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=385/500000]
+ train/ActionNoiseL2Loss=0.1765
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=386/500000]
+ train/ActionNoiseL2Loss=0.3876
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=387/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=388/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=389/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=390/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=391/500000]
+ train/ActionNoiseL2Loss=0.3077
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=392/500000]
+ train/ActionNoiseL2Loss=0.1965
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=393/500000]
+ train/ActionNoiseL2Loss=0.2254
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=394/500000]
+ train/ActionNoiseL2Loss=0.2223
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=395/500000]
+ train/ActionNoiseL2Loss=0.3349
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=396/500000]
+ train/ActionNoiseL2Loss=0.1950
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=397/500000]
+ train/ActionNoiseL2Loss=0.3117
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=398/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=399/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=400/500000]
+ optim/total_grad_norm=9.348
+ train/ActionNoiseL2Loss=0.2601
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=401/500000]
+ train/ActionNoiseL2Loss=0.2746
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=402/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=403/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=404/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=405/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=406/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=407/500000]
+ train/ActionNoiseL2Loss=0.1999
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=408/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=409/500000]
+ train/ActionNoiseL2Loss=0.2145
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=410/500000]
+ train/ActionNoiseL2Loss=0.2533
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=411/500000]
+ train/ActionNoiseL2Loss=0.1719
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=412/500000]
+ train/ActionNoiseL2Loss=0.3008
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=413/500000]
+ train/ActionNoiseL2Loss=0.2197
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=414/500000]
+ train/ActionNoiseL2Loss=0.1888
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=415/500000]
+ train/ActionNoiseL2Loss=0.2120
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=416/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=417/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=418/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=419/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=420/500000]
+ optim/total_grad_norm=9.671
+ train/ActionNoiseL2Loss=0.2808
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=421/500000]
+ train/ActionNoiseL2Loss=0.1809
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=422/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=423/500000]
+ train/ActionNoiseL2Loss=0.1867
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=424/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=425/500000]
+ train/ActionNoiseL2Loss=0.2313
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=426/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=427/500000]
+ train/ActionNoiseL2Loss=0.2666
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=428/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=429/500000]
+ train/ActionNoiseL2Loss=0.2136
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=430/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=431/500000]
+ train/ActionNoiseL2Loss=0.1783
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=432/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=433/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=434/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=435/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=436/500000]
+ train/ActionNoiseL2Loss=0.1963
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=437/500000]
+ train/ActionNoiseL2Loss=0.2339
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=438/500000]
+ train/ActionNoiseL2Loss=0.1803
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=439/500000]
+ train/ActionNoiseL2Loss=0.2020
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=440/500000]
+ optim/total_grad_norm=7.491
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=441/500000]
+ train/ActionNoiseL2Loss=0.2483
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=442/500000]
+ train/ActionNoiseL2Loss=0.1991
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=443/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=444/500000]
+ train/ActionNoiseL2Loss=0.1765
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=445/500000]
+ train/ActionNoiseL2Loss=0.2093
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=446/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=447/500000]
+ train/ActionNoiseL2Loss=0.1965
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=448/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=449/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=450/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=451/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=452/500000]
+ train/ActionNoiseL2Loss=0.2029
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=453/500000]
+ train/ActionNoiseL2Loss=0.3075
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=454/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=455/500000]
+ train/ActionNoiseL2Loss=0.2619
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=456/500000]
+ train/ActionNoiseL2Loss=0.2284
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=457/500000]
+ train/ActionNoiseL2Loss=0.2195
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=458/500000]
+ train/ActionNoiseL2Loss=0.2224
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=459/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=460/500000]
+ optim/total_grad_norm=10.41
+ train/ActionNoiseL2Loss=0.1988
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=461/500000]
+ train/ActionNoiseL2Loss=0.2170
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=462/500000]
+ train/ActionNoiseL2Loss=0.2263
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=463/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=464/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=465/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=466/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=467/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=468/500000]
+ train/ActionNoiseL2Loss=0.3020
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=469/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=470/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=471/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=472/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=473/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=474/500000]
+ train/ActionNoiseL2Loss=0.2230
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=475/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=476/500000]
+ train/ActionNoiseL2Loss=0.2154
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=477/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=478/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=479/500000]
+ train/ActionNoiseL2Loss=0.2079
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=480/500000]
+ optim/total_grad_norm=9.048
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=481/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=482/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=483/500000]
+ train/ActionNoiseL2Loss=0.2870
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=484/500000]
+ train/ActionNoiseL2Loss=0.1864
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=485/500000]
+ train/ActionNoiseL2Loss=0.1991
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=486/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=487/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=488/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=489/500000]
+ train/ActionNoiseL2Loss=0.1995
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=490/500000]
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=491/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=492/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=493/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=494/500000]
+ train/ActionNoiseL2Loss=0.1876
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=495/500000]
+ train/ActionNoiseL2Loss=0.2359
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=496/500000]
+ train/ActionNoiseL2Loss=0.2422
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=497/500000]
+ train/ActionNoiseL2Loss=0.1743
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=498/500000]
+ train/ActionNoiseL2Loss=0.2059
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=499/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=500/500000]
+ optim/total_grad_norm=7.464
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/24 [11:24:08] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+09/24 [11:24:11] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+09/24 [11:24:14] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+09/24 [11:24:31] INFO | >> Saving config... checkpoint.py:608
+09/24 [11:24:58] INFO | >> Saving model state... checkpoint.py:796
+09/24 [11:25:59] INFO | >> Saving optim state... checkpoint.py:811
+09/24 [11:26:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=502/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=503/500000]
+ train/ActionNoiseL2Loss=0.2379
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=504/500000]
+ train/ActionNoiseL2Loss=0.2780
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=505/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=506/500000]
+ train/ActionNoiseL2Loss=0.1939
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=507/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=508/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=509/500000]
+ train/ActionNoiseL2Loss=0.1759
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=510/500000]
+ train/ActionNoiseL2Loss=0.1712
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=511/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=512/500000]
+ train/ActionNoiseL2Loss=0.2377
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=513/500000]
+ train/ActionNoiseL2Loss=0.1934
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=514/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=515/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=516/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=517/500000]
+ train/ActionNoiseL2Loss=0.1516
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=518/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=519/500000]
+ train/ActionNoiseL2Loss=0.2969
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=520/500000]
+ optim/total_grad_norm=9.796
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=521/500000]
+ train/ActionNoiseL2Loss=0.1940
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=522/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=523/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=524/500000]
+ train/ActionNoiseL2Loss=0.2764
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=525/500000]
+ train/ActionNoiseL2Loss=0.2654
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=526/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=527/500000]
+ train/ActionNoiseL2Loss=0.2684
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=528/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=529/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=530/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=531/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=532/500000]
+ train/ActionNoiseL2Loss=0.2195
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=533/500000]
+ train/ActionNoiseL2Loss=0.3007
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=534/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=535/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=536/500000]
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=537/500000]
+ train/ActionNoiseL2Loss=0.2711
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=538/500000]
+ train/ActionNoiseL2Loss=0.2384
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=539/500000]
+ train/ActionNoiseL2Loss=0.1348
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=540/500000]
+ optim/total_grad_norm=5.142
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=541/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=542/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=543/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=544/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=545/500000]
+ train/ActionNoiseL2Loss=0.2088
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=546/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=547/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=548/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=549/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=550/500000]
+ train/ActionNoiseL2Loss=0.2263
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=551/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=552/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=553/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=554/500000]
+ train/ActionNoiseL2Loss=0.2688
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=555/500000]
+ train/ActionNoiseL2Loss=0.3086
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=556/500000]
+ train/ActionNoiseL2Loss=0.1693
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=557/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=558/500000]
+ train/ActionNoiseL2Loss=0.2135
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=559/500000]
+ train/ActionNoiseL2Loss=0.2604
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=560/500000]
+ optim/total_grad_norm=8.154
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=561/500000]
+ train/ActionNoiseL2Loss=0.1878
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=562/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=563/500000]
+ train/ActionNoiseL2Loss=0.1761
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=564/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=565/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=566/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=567/500000]
+ train/ActionNoiseL2Loss=0.1853
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=568/500000]
+ train/ActionNoiseL2Loss=0.2834
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=569/500000]
+ train/ActionNoiseL2Loss=0.1703
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=570/500000]
+ train/ActionNoiseL2Loss=0.2129
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=571/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=572/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=573/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=574/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=575/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=576/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=577/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=578/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=579/500000]
+ train/ActionNoiseL2Loss=0.2348
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=580/500000]
+ optim/total_grad_norm=11.25
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=581/500000]
+ train/ActionNoiseL2Loss=0.2760
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=582/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=583/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=584/500000]
+ train/ActionNoiseL2Loss=0.2042
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=585/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=586/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=587/500000]
+ train/ActionNoiseL2Loss=0.1822
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=588/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=589/500000]
+ train/ActionNoiseL2Loss=0.2936
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=590/500000]
+ train/ActionNoiseL2Loss=0.2554
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=591/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=592/500000]
+ train/ActionNoiseL2Loss=0.1673
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=593/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=594/500000]
+ train/ActionNoiseL2Loss=0.2147
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=595/500000]
+ train/ActionNoiseL2Loss=0.2069
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=596/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=597/500000]
+ train/ActionNoiseL2Loss=0.2116
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=598/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=599/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=600/500000]
+ optim/total_grad_norm=5.829
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=601/500000]
+ train/ActionNoiseL2Loss=0.2485
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=602/500000]
+ train/ActionNoiseL2Loss=0.2350
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=603/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=604/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=605/500000]
+ train/ActionNoiseL2Loss=0.1409
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=606/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=607/500000]
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=608/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=609/500000]
+ train/ActionNoiseL2Loss=0.2142
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=610/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=611/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=612/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=613/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=614/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=615/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=616/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=617/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=618/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=619/500000]
+ train/ActionNoiseL2Loss=0.2615
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=620/500000]
+ optim/total_grad_norm=8.089
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=621/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=622/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=623/500000]
+ train/ActionNoiseL2Loss=0.1857
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=624/500000]
+ train/ActionNoiseL2Loss=0.2095
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=625/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=626/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=627/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=628/500000]
+ train/ActionNoiseL2Loss=0.2353
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=629/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=630/500000]
+ train/ActionNoiseL2Loss=0.2157
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=631/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=632/500000]
+ train/ActionNoiseL2Loss=0.2953
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=633/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=634/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=635/500000]
+ train/ActionNoiseL2Loss=0.1756
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=636/500000]
+ train/ActionNoiseL2Loss=0.2657
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=637/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=638/500000]
+ train/ActionNoiseL2Loss=0.2693
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=639/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=640/500000]
+ optim/total_grad_norm=7.359
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=641/500000]
+ train/ActionNoiseL2Loss=0.2991
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=642/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=643/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=644/500000]
+ train/ActionNoiseL2Loss=0.2042
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=645/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=646/500000]
+ train/ActionNoiseL2Loss=0.1735
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=647/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=648/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=649/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=650/500000]
+ train/ActionNoiseL2Loss=0.1811
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=651/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=652/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=653/500000]
+ train/ActionNoiseL2Loss=0.1787
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=654/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=655/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=656/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=657/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=658/500000]
+ train/ActionNoiseL2Loss=0.2565
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=659/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=660/500000]
+ optim/total_grad_norm=11.55
+ train/ActionNoiseL2Loss=0.2360
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=661/500000]
+ train/ActionNoiseL2Loss=0.2175
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=662/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=663/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=664/500000]
+ train/ActionNoiseL2Loss=0.3475
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=665/500000]
+ train/ActionNoiseL2Loss=0.2571
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=666/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=667/500000]
+ train/ActionNoiseL2Loss=0.3848
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=668/500000]
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=669/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=670/500000]
+ train/ActionNoiseL2Loss=0.1941
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=671/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=672/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=673/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=674/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=675/500000]
+ train/ActionNoiseL2Loss=0.1942
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=676/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=677/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=678/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=679/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=680/500000]
+ optim/total_grad_norm=15.32
+ train/ActionNoiseL2Loss=0.4153
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=681/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=682/500000]
+ train/ActionNoiseL2Loss=0.1536
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=683/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=684/500000]
+ train/ActionNoiseL2Loss=0.3053
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=685/500000]
+ train/ActionNoiseL2Loss=0.1723
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=686/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=687/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=688/500000]
+ train/ActionNoiseL2Loss=0.1643
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=689/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=690/500000]
+ train/ActionNoiseL2Loss=0.2457
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=691/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=692/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=693/500000]
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=694/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=695/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=696/500000]
+ train/ActionNoiseL2Loss=0.3140
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=697/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=698/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=699/500000]
+ train/ActionNoiseL2Loss=0.2203
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=700/500000]
+ optim/total_grad_norm=8.431
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=701/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=702/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=703/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=704/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=705/500000]
+ train/ActionNoiseL2Loss=0.2342
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=706/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=707/500000]
+ train/ActionNoiseL2Loss=0.2411
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=708/500000]
+ train/ActionNoiseL2Loss=0.2152
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=709/500000]
+ train/ActionNoiseL2Loss=0.2224
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=710/500000]
+ train/ActionNoiseL2Loss=0.2475
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=711/500000]
+ train/ActionNoiseL2Loss=0.2332
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=712/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=713/500000]
+ train/ActionNoiseL2Loss=0.2320
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=714/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=715/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=716/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=717/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=718/500000]
+ train/ActionNoiseL2Loss=0.1825
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=719/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=720/500000]
+ optim/total_grad_norm=7.116
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=721/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=722/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=723/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=724/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=725/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=726/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=727/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=728/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=729/500000]
+ train/ActionNoiseL2Loss=0.1786
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=730/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=731/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=732/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=733/500000]
+ train/ActionNoiseL2Loss=0.2036
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=734/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=735/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=736/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=737/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=738/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=739/500000]
+ train/ActionNoiseL2Loss=0.2125
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=740/500000]
+ optim/total_grad_norm=7.513
+ train/ActionNoiseL2Loss=0.2225
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=741/500000]
+ train/ActionNoiseL2Loss=0.2003
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=742/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=743/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=744/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=745/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=746/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=747/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=748/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=749/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=750/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=751/500000]
+ train/ActionNoiseL2Loss=0.1852
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=752/500000]
+ train/ActionNoiseL2Loss=0.2196
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=753/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=754/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=755/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=756/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=757/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=758/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=759/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=760/500000]
+ optim/total_grad_norm=10.91
+ train/ActionNoiseL2Loss=0.2816
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=761/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=762/500000]
+ train/ActionNoiseL2Loss=0.2414
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=763/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=764/500000]
+ train/ActionNoiseL2Loss=0.1864
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=765/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=766/500000]
+ train/ActionNoiseL2Loss=0.2302
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=767/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=768/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=769/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=770/500000]
+ train/ActionNoiseL2Loss=0.1993
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=771/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=772/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=773/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=774/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=775/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=776/500000]
+ train/ActionNoiseL2Loss=0.2972
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=777/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=778/500000]
+ train/ActionNoiseL2Loss=0.1973
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=779/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=780/500000]
+ optim/total_grad_norm=9.309
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=781/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=782/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=783/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=784/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=785/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=786/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=787/500000]
+ train/ActionNoiseL2Loss=0.1990
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=788/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=789/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=790/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=791/500000]
+ train/ActionNoiseL2Loss=0.1952
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=792/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=793/500000]
+ train/ActionNoiseL2Loss=0.1703
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=794/500000]
+ train/ActionNoiseL2Loss=0.2050
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=795/500000]
+ train/ActionNoiseL2Loss=0.1915
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=796/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=797/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=798/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=799/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=800/500000]
+ optim/total_grad_norm=6.777
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=801/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=802/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=803/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=804/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=805/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=806/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=807/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=808/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=809/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=810/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=811/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=812/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=813/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=814/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=815/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=816/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=817/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=818/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=819/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=820/500000]
+ optim/total_grad_norm=6.368
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=821/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=822/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=823/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=824/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=825/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=826/500000]
+ train/ActionNoiseL2Loss=0.1806
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=827/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=828/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=829/500000]
+ train/ActionNoiseL2Loss=0.1404
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=830/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=831/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=832/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=833/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=834/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=835/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=836/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=837/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=838/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=839/500000]
+ train/ActionNoiseL2Loss=0.1931
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=840/500000]
+ optim/total_grad_norm=5.497
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=841/500000]
+ train/ActionNoiseL2Loss=0.1841
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=842/500000]
+ train/ActionNoiseL2Loss=0.1431
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=843/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=844/500000]
+ train/ActionNoiseL2Loss=0.1797
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=845/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=846/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=847/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=848/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=849/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=850/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=851/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=852/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=853/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=854/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=855/500000]
+ train/ActionNoiseL2Loss=0.2707
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=856/500000]
+ train/ActionNoiseL2Loss=0.1693
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=857/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=858/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=859/500000]
+ train/ActionNoiseL2Loss=0.3467
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=860/500000]
+ optim/total_grad_norm=8.669
+ train/ActionNoiseL2Loss=0.1516
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=861/500000]
+ train/ActionNoiseL2Loss=0.2021
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=862/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=863/500000]
+ train/ActionNoiseL2Loss=0.1905
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=864/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=865/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=866/500000]
+ train/ActionNoiseL2Loss=0.2987
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=867/500000]
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=868/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=869/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=870/500000]
+ train/ActionNoiseL2Loss=0.1632
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=871/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=872/500000]
+ train/ActionNoiseL2Loss=0.2206
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=873/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=874/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=875/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=876/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=877/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=878/500000]
+ train/ActionNoiseL2Loss=0.2061
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=879/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=880/500000]
+ optim/total_grad_norm=3.752
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=881/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=882/500000]
+ train/ActionNoiseL2Loss=0.1386
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=883/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=884/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=885/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=886/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=887/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=888/500000]
+ train/ActionNoiseL2Loss=0.2192
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=889/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=890/500000]
+ train/ActionNoiseL2Loss=0.1932
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=891/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=892/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=893/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=894/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=895/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=896/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=897/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=898/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=899/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=900/500000]
+ optim/total_grad_norm=4.053
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=901/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=902/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=903/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=904/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=905/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=906/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=907/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=908/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=909/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=910/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=911/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=912/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=913/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=914/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=915/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=916/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=917/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=918/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=919/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=920/500000]
+ optim/total_grad_norm=4.158
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=921/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=922/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=923/500000]
+ train/ActionNoiseL2Loss=0.1866
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=924/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=925/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=926/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=927/500000]
+ train/ActionNoiseL2Loss=0.1902
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=928/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=929/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=930/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=931/500000]
+ train/ActionNoiseL2Loss=0.3295
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=932/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=933/500000]
+ train/ActionNoiseL2Loss=0.2310
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=934/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=935/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=936/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=937/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=938/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=939/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=940/500000]
+ optim/total_grad_norm=6.654
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=941/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=942/500000]
+ train/ActionNoiseL2Loss=0.2358
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=943/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=944/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=945/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=946/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=947/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=948/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=949/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=950/500000]
+ train/ActionNoiseL2Loss=0.1882
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=951/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=952/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=953/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=954/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=955/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=956/500000]
+ train/ActionNoiseL2Loss=0.1811
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=957/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=958/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=959/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=960/500000]
+ optim/total_grad_norm=5.013
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=961/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=962/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=963/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=964/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=965/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=966/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=967/500000]
+ train/ActionNoiseL2Loss=0.1920
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=968/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=969/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=970/500000]
+ train/ActionNoiseL2Loss=0.2041
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=971/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=972/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=973/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=974/500000]
+ train/ActionNoiseL2Loss=0.2058
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=975/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=976/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=977/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=978/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=979/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=980/500000]
+ optim/total_grad_norm=4.533
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=981/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=982/500000]
+ train/ActionNoiseL2Loss=0.1848
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=983/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=984/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=985/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=986/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=987/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=988/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=989/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=990/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=991/500000]
+ train/ActionNoiseL2Loss=0.1780
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=992/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=993/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=994/500000]
+ train/ActionNoiseL2Loss=0.2112
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=995/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=996/500000]
+ train/ActionNoiseL2Loss=0.2149
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=997/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=998/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=999/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1000/500000]
+ optim/total_grad_norm=9.526
+ train/ActionNoiseL2Loss=0.1765
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/24 [14:24:40] INFO | >> Saving config... checkpoint.py:608
+09/24 [14:25:16] INFO | >> Saving model state... checkpoint.py:796
+09/24 [14:26:17] INFO | >> Saving optim state... checkpoint.py:811
+09/24 [14:26:22] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionNoiseL2Loss=0.2270
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=1002/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=1003/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=1004/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=1005/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=1006/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=1007/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1008/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1009/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1010/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1011/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1012/500000]
+ train/ActionNoiseL2Loss=0.2027
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1013/500000]
+ train/ActionNoiseL2Loss=0.1800
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1014/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1015/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1016/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1017/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1018/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1019/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1020/500000]
+ optim/total_grad_norm=4.156
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1021/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1022/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1023/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1024/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1025/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1026/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1027/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1028/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1029/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1030/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1031/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1032/500000]
+ train/ActionNoiseL2Loss=0.1669
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1033/500000]
+ train/ActionNoiseL2Loss=0.1633
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1034/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1035/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1036/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1037/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1038/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1039/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1040/500000]
+ optim/total_grad_norm=5.026
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1041/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1042/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1043/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1044/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1045/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1046/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1047/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1048/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1049/500000]
+ train/ActionNoiseL2Loss=0.1603
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1050/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1051/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1052/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1053/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1054/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1055/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1056/500000]
+ train/ActionNoiseL2Loss=0.2327
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1057/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1058/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1059/500000]
+ train/ActionNoiseL2Loss=0.2095
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1060/500000]
+ optim/total_grad_norm=6.463
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1061/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1062/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1063/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1064/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1065/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1066/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1067/500000]
+ train/ActionNoiseL2Loss=0.2100
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1068/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1069/500000]
+ train/ActionNoiseL2Loss=0.2333
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1070/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1071/500000]
+ train/ActionNoiseL2Loss=0.1683
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1072/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1073/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1074/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1075/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1076/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1077/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1078/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1079/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1080/500000]
+ optim/total_grad_norm=5.768
+ train/ActionNoiseL2Loss=0.2023
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1081/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1082/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1083/500000]
+ train/ActionNoiseL2Loss=0.1678
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1084/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1085/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1086/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1087/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1088/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1089/500000]
+ train/ActionNoiseL2Loss=0.1659
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1090/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1091/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1092/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1093/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1094/500000]
+ train/ActionNoiseL2Loss=0.1613
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1095/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1096/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1097/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1098/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1099/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1100/500000]
+ optim/total_grad_norm=4.503
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1101/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1102/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1103/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1104/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1105/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1106/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1107/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1108/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1109/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1110/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1111/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1112/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1113/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1114/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1115/500000]
+ train/ActionNoiseL2Loss=0.2397
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1116/500000]
+ train/ActionNoiseL2Loss=0.2467
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1117/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1118/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1119/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1120/500000]
+ optim/total_grad_norm=4.042
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1121/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1122/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1123/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1124/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1125/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1126/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1127/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1128/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1129/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1130/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1131/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1132/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1133/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1134/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1135/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1136/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1137/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1138/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1139/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1140/500000]
+ optim/total_grad_norm=7.982
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1141/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1142/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1143/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1144/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1145/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1146/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1147/500000]
+ train/ActionNoiseL2Loss=0.2127
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1148/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1149/500000]
+ train/ActionNoiseL2Loss=0.1910
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1150/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1151/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1152/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1153/500000]
+ train/ActionNoiseL2Loss=0.1960
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1154/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1155/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1156/500000]
+ train/ActionNoiseL2Loss=0.2299
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1157/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1158/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1159/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1160/500000]
+ optim/total_grad_norm=3.402
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1161/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1162/500000]
+ train/ActionNoiseL2Loss=0.2145
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1163/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1164/500000]
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1165/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1166/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1167/500000]
+ train/ActionNoiseL2Loss=0.2187
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1168/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1169/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1170/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1171/500000]
+ train/ActionNoiseL2Loss=0.3848
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1172/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1173/500000]
+ train/ActionNoiseL2Loss=0.1553
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1174/500000]
+ train/ActionNoiseL2Loss=0.2425
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1175/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1176/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1177/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1178/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1179/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1180/500000]
+ optim/total_grad_norm=4.582
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1181/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1182/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1183/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1184/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1185/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1186/500000]
+ train/ActionNoiseL2Loss=0.1761
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1187/500000]
+ train/ActionNoiseL2Loss=0.1758
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1188/500000]
+ train/ActionNoiseL2Loss=0.2251
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1189/500000]
+ train/ActionNoiseL2Loss=0.2039
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1190/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1191/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1192/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1193/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1194/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1195/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1196/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1197/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1198/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1199/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1200/500000]
+ optim/total_grad_norm=3.700
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1201/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1202/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1203/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1204/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1205/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1206/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1207/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1208/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1209/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1210/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1211/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1212/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1213/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1214/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1215/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1216/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1217/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1218/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1219/500000]
+ train/ActionNoiseL2Loss=0.1934
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1220/500000]
+ optim/total_grad_norm=3.382
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1221/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1222/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1223/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1224/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1225/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1226/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1227/500000]
+ train/ActionNoiseL2Loss=0.1555
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1228/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1229/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1230/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1231/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1232/500000]
+ train/ActionNoiseL2Loss=0.2209
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1233/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1234/500000]
+ train/ActionNoiseL2Loss=0.1889
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1235/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1236/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1237/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1238/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1239/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1240/500000]
+ optim/total_grad_norm=4.140
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1241/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1242/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1243/500000]
+ train/ActionNoiseL2Loss=0.2245
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1244/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1245/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1246/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1247/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1248/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1249/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1250/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1251/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1252/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1253/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1254/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1255/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1256/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1257/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1258/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1259/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1260/500000]
+ optim/total_grad_norm=3.682
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1261/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1262/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1263/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1264/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1265/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1266/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1267/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1268/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1269/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1270/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1271/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1272/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1273/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1274/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1275/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1276/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1277/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1278/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1279/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1280/500000]
+ optim/total_grad_norm=3.976
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1281/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1282/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1283/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1284/500000]
+ train/ActionNoiseL2Loss=0.1868
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1285/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1286/500000]
+ train/ActionNoiseL2Loss=0.2017
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1287/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1288/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1289/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1290/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1291/500000]
+ train/ActionNoiseL2Loss=0.2403
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1292/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1293/500000]
+ train/ActionNoiseL2Loss=0.2273
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1294/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1295/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1296/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1297/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1298/500000]
+ train/ActionNoiseL2Loss=0.1700
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1299/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1300/500000]
+ optim/total_grad_norm=2.743
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1301/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1302/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1303/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1304/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1305/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1306/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1307/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1308/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1309/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1310/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1311/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1312/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1313/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1314/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1315/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1316/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1317/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1318/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1319/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1320/500000]
+ optim/total_grad_norm=5.200
+ train/ActionNoiseL2Loss=0.1348
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1321/500000]
+ train/ActionNoiseL2Loss=0.1686
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1322/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1323/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1324/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1325/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1326/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1327/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1328/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1329/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1330/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1331/500000]
+ train/ActionNoiseL2Loss=0.1731
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1332/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1333/500000]
+ train/ActionNoiseL2Loss=0.2102
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1334/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1335/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1336/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1337/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1338/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1339/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1340/500000]
+ optim/total_grad_norm=4.661
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1341/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1342/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1343/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1344/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1345/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1346/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1347/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1348/500000]
+ train/ActionNoiseL2Loss=0.2309
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1349/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1350/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1351/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1352/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1353/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1354/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1355/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1356/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1357/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1358/500000]
+ train/ActionNoiseL2Loss=0.2334
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1359/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1360/500000]
+ optim/total_grad_norm=5.854
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1361/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1362/500000]
+ train/ActionNoiseL2Loss=0.1404
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1363/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1364/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1365/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1366/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1367/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1368/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1369/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1370/500000]
+ train/ActionNoiseL2Loss=0.2762
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1371/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1372/500000]
+ train/ActionNoiseL2Loss=0.2447
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1373/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1374/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1375/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1376/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1377/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1378/500000]
+ train/ActionNoiseL2Loss=0.1505
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1379/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1380/500000]
+ optim/total_grad_norm=4.003
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1381/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1382/500000]
+ train/ActionNoiseL2Loss=0.2588
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1383/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1384/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1385/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1386/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1387/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1388/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1389/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1390/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1391/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1392/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1393/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1394/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1395/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1396/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1397/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1398/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1399/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1400/500000]
+ optim/total_grad_norm=4.275
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1401/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1402/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1403/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1404/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1405/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1406/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1407/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1408/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1409/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1410/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1411/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1412/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1413/500000]
+ train/ActionNoiseL2Loss=0.2312
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1414/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1415/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1416/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1417/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1418/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1419/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1420/500000]
+ optim/total_grad_norm=4.556
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1421/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1422/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1423/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1424/500000]
+ train/ActionNoiseL2Loss=0.2119
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1425/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1426/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1427/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1428/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1429/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1430/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1431/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1432/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1433/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1434/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1435/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1436/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1437/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1438/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1439/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1440/500000]
+ optim/total_grad_norm=4.074
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1441/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1442/500000]
+ train/ActionNoiseL2Loss=0.1950
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1443/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1444/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1445/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1446/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1447/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1448/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1449/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1450/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1451/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1452/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1453/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1454/500000]
+ train/ActionNoiseL2Loss=0.1863
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1455/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1456/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1457/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1458/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1459/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1460/500000]
+ optim/total_grad_norm=6.260
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1461/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1462/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1463/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1464/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1465/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1466/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1467/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1468/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1469/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1470/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1471/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1472/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1473/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1474/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1475/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1476/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1477/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1478/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1479/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1480/500000]
+ optim/total_grad_norm=3.063
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1481/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1482/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1483/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1484/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1485/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1486/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1487/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1488/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1489/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1490/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1491/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1492/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1493/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1494/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1495/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1496/500000]
+ train/ActionNoiseL2Loss=0.1590
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1497/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1498/500000]
+ train/ActionNoiseL2Loss=0.1833
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1499/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1500/500000]
+ optim/total_grad_norm=4.397
+ train/ActionNoiseL2Loss=0.1755
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/24 [17:24:52] INFO | >> Saving config... checkpoint.py:608
+09/24 [17:25:26] INFO | >> Saving model state... checkpoint.py:796
+09/24 [17:26:29] INFO | >> Saving optim state... checkpoint.py:811
+09/24 [17:26:34] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=1502/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1503/500000]
+ train/ActionNoiseL2Loss=0.1777
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1504/500000]
+ train/ActionNoiseL2Loss=0.2060
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=1505/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=1506/500000]
+ train/ActionNoiseL2Loss=0.2590
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=1507/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=1508/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=1509/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=1510/500000]
+ train/ActionNoiseL2Loss=0.1868
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+ System/Peak GPU Memory (MB)=44,437
+[step=1511/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=1512/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=1513/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=1514/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=1515/500000]
+ train/ActionNoiseL2Loss=0.1683
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=1516/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=1517/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1518/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1519/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1520/500000]
+ optim/total_grad_norm=3.750
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1521/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1522/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1523/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1524/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1525/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1526/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1527/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1528/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1529/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1530/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1531/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1532/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1533/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1534/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1535/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1536/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1537/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1538/500000]
+ train/ActionNoiseL2Loss=0.1864
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1539/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1540/500000]
+ optim/total_grad_norm=3.842
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1541/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1542/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1543/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1544/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1545/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1546/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1547/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1548/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1549/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1550/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1551/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=1552/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=1553/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=1554/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=1555/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1556/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1557/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1558/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1559/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1560/500000]
+ optim/total_grad_norm=2.852
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1561/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1562/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1563/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1564/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1565/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1566/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1567/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1568/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1569/500000]
+ train/ActionNoiseL2Loss=0.2239
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1570/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1571/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1572/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1573/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1574/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1575/500000]
+ train/ActionNoiseL2Loss=0.1601
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1576/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1577/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1578/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1579/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1580/500000]
+ optim/total_grad_norm=4.052
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1581/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1582/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1583/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1584/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1585/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1586/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1587/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1588/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1589/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1590/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1591/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1592/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1593/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1594/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1595/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1596/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1597/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1598/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1599/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1600/500000]
+ optim/total_grad_norm=4.320
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1601/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1602/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1603/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1604/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1605/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1606/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1607/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1608/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1609/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1610/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1611/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1612/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1613/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1614/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1615/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1616/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1617/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1618/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1619/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1620/500000]
+ optim/total_grad_norm=2.617
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1621/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1622/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1623/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1624/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1625/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1626/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1627/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1628/500000]
+ train/ActionNoiseL2Loss=0.1999
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1629/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1630/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1631/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1632/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1633/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1634/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1635/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1636/500000]
+ train/ActionNoiseL2Loss=0.1638
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1637/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1638/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1639/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1640/500000]
+ optim/total_grad_norm=3.960
+ train/ActionNoiseL2Loss=0.1431
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1641/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1642/500000]
+ train/ActionNoiseL2Loss=0.2435
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1643/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1644/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1645/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1646/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1647/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1648/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1649/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1650/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1651/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1652/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1653/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1654/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1655/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1656/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1657/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1658/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1659/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1660/500000]
+ optim/total_grad_norm=2.592
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1661/500000]
+ train/ActionNoiseL2Loss=0.1853
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1662/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1663/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1664/500000]
+ train/ActionNoiseL2Loss=0.1960
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1665/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1666/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1667/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1668/500000]
+ train/ActionNoiseL2Loss=0.1848
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1669/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1670/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1671/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1672/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1673/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1674/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1675/500000]
+ train/ActionNoiseL2Loss=0.1490
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1676/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1677/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1678/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1679/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1680/500000]
+ optim/total_grad_norm=2.830
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1681/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1682/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1683/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1684/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1685/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1686/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1687/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1688/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1689/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1690/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1691/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1692/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1693/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1694/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1695/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1696/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1697/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1698/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1699/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1700/500000]
+ optim/total_grad_norm=4.174
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1701/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1702/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1703/500000]
+ train/ActionNoiseL2Loss=0.1457
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1704/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1705/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1706/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1707/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1708/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1709/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1710/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1711/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1712/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1713/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1714/500000]
+ train/ActionNoiseL2Loss=0.1970
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1715/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1716/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1717/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1718/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1719/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1720/500000]
+ optim/total_grad_norm=3.416
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1721/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1722/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1723/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1724/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1725/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1726/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1727/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1728/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1729/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1730/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1731/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1732/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1733/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1734/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1735/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1736/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1737/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1738/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1739/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1740/500000]
+ optim/total_grad_norm=2.465
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1741/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1742/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1743/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1744/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1745/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1746/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1747/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1748/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1749/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1750/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1751/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1752/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1753/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1754/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1755/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1756/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1757/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1758/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1759/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1760/500000]
+ optim/total_grad_norm=2.459
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1761/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1762/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1763/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1764/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1765/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1766/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1767/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1768/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1769/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1770/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1771/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1772/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1773/500000]
+ train/ActionNoiseL2Loss=0.2243
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1774/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1775/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1776/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1777/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1778/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1779/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1780/500000]
+ optim/total_grad_norm=3.857
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1781/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1782/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1783/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1784/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1785/500000]
+ train/ActionNoiseL2Loss=0.1726
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1786/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1787/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1788/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1789/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1790/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1791/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1792/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1793/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1794/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1795/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1796/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1797/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1798/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1799/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1800/500000]
+ optim/total_grad_norm=2.821
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1801/500000]
+ train/ActionNoiseL2Loss=0.1701
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1802/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1803/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1804/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1805/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1806/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1807/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1808/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1809/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1810/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1811/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1812/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1813/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1814/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1815/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1816/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1817/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1818/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1819/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1820/500000]
+ optim/total_grad_norm=2.703
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1821/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1822/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1823/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1824/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1825/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1826/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1827/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1828/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1829/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1830/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1831/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1832/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1833/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1834/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1835/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1836/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1837/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1838/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1839/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1840/500000]
+ optim/total_grad_norm=3.497
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1841/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1842/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1843/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1844/500000]
+ train/ActionNoiseL2Loss=0.1910
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1845/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1846/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1847/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1848/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1849/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1850/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1851/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1852/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1853/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1854/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1855/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1856/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1857/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1858/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1859/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1860/500000]
+ optim/total_grad_norm=4.399
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1861/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1862/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1863/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1864/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1865/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1866/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1867/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1868/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1869/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1870/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1871/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1872/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1873/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1874/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1875/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1876/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1877/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1878/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1879/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=1880/500000]
+ optim/total_grad_norm=2.154
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1881/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1882/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1883/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1884/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1885/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1886/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1887/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1888/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1889/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1890/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1891/500000]
+ train/ActionNoiseL2Loss=0.1978
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1892/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1893/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1894/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1895/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1896/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1897/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1898/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1899/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=1900/500000]
+ optim/total_grad_norm=1.812
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1901/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1902/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1903/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1904/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=1905/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1906/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1907/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1908/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1909/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1910/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1911/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1912/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1913/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1914/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1915/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1916/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1917/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1918/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1919/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1920/500000]
+ optim/total_grad_norm=2.061
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1921/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1922/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1923/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1924/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1925/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1926/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1927/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1928/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1929/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1930/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1931/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1932/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1933/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1934/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1935/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1936/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1937/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1938/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1939/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1940/500000]
+ optim/total_grad_norm=4.143
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1941/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1942/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1943/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1944/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1945/500000]
+ train/ActionNoiseL2Loss=0.1627
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1946/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1947/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1948/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1949/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1950/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1951/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1952/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1953/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=1954/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1955/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1956/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1957/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1958/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1959/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1960/500000]
+ optim/total_grad_norm=3.504
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=1961/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1962/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1963/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1964/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1965/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1966/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1967/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1968/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1969/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=1970/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=1971/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1972/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1973/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1974/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1975/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1976/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1977/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1978/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1979/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1980/500000]
+ optim/total_grad_norm=2.768
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1981/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1982/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1983/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1984/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1985/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1986/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1987/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1988/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1989/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1990/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=1991/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1992/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1993/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1994/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=1995/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=1996/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1997/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1998/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=1999/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2000/500000]
+ optim/total_grad_norm=3.270
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/24 [20:25:06] INFO | >> Saving config... checkpoint.py:608
+09/24 [20:25:37] INFO | >> Saving model state... checkpoint.py:796
+09/24 [20:26:38] INFO | >> Saving optim state... checkpoint.py:811
+09/24 [20:26:42] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=2002/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2003/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=2004/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=2005/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=2006/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=2007/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=2008/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=2009/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=2010/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+ System/Peak GPU Memory (MB)=44,437
+[step=2011/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=2012/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=2013/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2014/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2015/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2016/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2017/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2018/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2019/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2020/500000]
+ optim/total_grad_norm=2.251
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2021/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2022/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2023/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2024/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2025/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2026/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2027/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2028/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2029/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2030/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2031/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2032/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2033/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2034/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2035/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2036/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2037/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2038/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2039/500000]
+ train/ActionNoiseL2Loss=0.1641
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2040/500000]
+ optim/total_grad_norm=3.910
+ train/ActionNoiseL2Loss=0.1846
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2041/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2042/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2043/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2044/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2045/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2046/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2047/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2048/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2049/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2050/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2051/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2052/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2053/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2054/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2055/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2056/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2057/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2058/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2059/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2060/500000]
+ optim/total_grad_norm=2.693
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2061/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2062/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2063/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2064/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2065/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2066/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2067/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2068/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2069/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2070/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2071/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2072/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2073/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2074/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2075/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2076/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2077/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2078/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2079/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2080/500000]
+ optim/total_grad_norm=3.254
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2081/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2082/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2083/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2084/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2085/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2086/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2087/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2088/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2089/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2090/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2091/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2092/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2093/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2094/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2095/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2096/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2097/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2098/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2099/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2100/500000]
+ optim/total_grad_norm=1.948
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2101/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2102/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2103/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2104/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2105/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2106/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2107/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2108/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2109/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2110/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2111/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2112/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2113/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2114/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2115/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2116/500000]
+ train/ActionNoiseL2Loss=0.1549
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2117/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2118/500000]
+ train/ActionNoiseL2Loss=0.1633
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2119/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2120/500000]
+ optim/total_grad_norm=1.820
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2121/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2122/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2123/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2124/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2125/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2126/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2127/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2128/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2129/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2130/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2131/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2132/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2133/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2134/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2135/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2136/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2137/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2138/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2139/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2140/500000]
+ optim/total_grad_norm=2.495
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2141/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2142/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2143/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2144/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2145/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2146/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2147/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2148/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2149/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2150/500000]
+ train/ActionNoiseL2Loss=0.2501
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2151/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2152/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2153/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2154/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2155/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2156/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2157/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2158/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2159/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2160/500000]
+ optim/total_grad_norm=1.980
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2161/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2162/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2163/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2164/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2165/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2166/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2167/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2168/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2169/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2170/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2171/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2172/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2173/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2174/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2175/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2176/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2177/500000]
+ train/ActionNoiseL2Loss=0.1908
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2178/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2179/500000]
+ train/ActionNoiseL2Loss=0.1647
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2180/500000]
+ optim/total_grad_norm=2.901
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2181/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2182/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2183/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2184/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2185/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2186/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2187/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2188/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2189/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2190/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2191/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2192/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2193/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2194/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2195/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2196/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2197/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2198/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2199/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2200/500000]
+ optim/total_grad_norm=1.760
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2201/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2202/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2203/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2204/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2205/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2206/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2207/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2208/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2209/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2210/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2211/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2212/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2213/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2214/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2215/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2216/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2217/500000]
+ train/ActionNoiseL2Loss=0.1393
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2218/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2219/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2220/500000]
+ optim/total_grad_norm=2.064
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2221/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2222/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2223/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2224/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2225/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2226/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2227/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2228/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2229/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2230/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2231/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2232/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2233/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2234/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2235/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2236/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2237/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2238/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2239/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2240/500000]
+ optim/total_grad_norm=2.572
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2241/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2242/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2243/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2244/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2245/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2246/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2247/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2248/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2249/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2250/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2251/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2252/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2253/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2254/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2255/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2256/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2257/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2258/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2259/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2260/500000]
+ optim/total_grad_norm=2.117
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2261/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2262/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2263/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2264/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2265/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2266/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2267/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2268/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2269/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2270/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2271/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2272/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2273/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2274/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2275/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2276/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2277/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2278/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2279/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2280/500000]
+ optim/total_grad_norm=1.294
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2281/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2282/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2283/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2284/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2285/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2286/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2287/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2288/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2289/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2290/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2291/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2292/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2293/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2294/500000]
+ train/ActionNoiseL2Loss=0.1678
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2295/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2296/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2297/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2298/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2299/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2300/500000]
+ optim/total_grad_norm=3.627
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2301/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2302/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2303/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2304/500000]
+ train/ActionNoiseL2Loss=0.1689
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2305/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2306/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2307/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2308/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2309/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2310/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2311/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2312/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2313/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2314/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2315/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2316/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2317/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2318/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2319/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2320/500000]
+ optim/total_grad_norm=1.705
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2321/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2322/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2323/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2324/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2325/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2326/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2327/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2328/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2329/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2330/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2331/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2332/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2333/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2334/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2335/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2336/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2337/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2338/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2339/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2340/500000]
+ optim/total_grad_norm=2.413
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2341/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2342/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2343/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2344/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2345/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2346/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2347/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2348/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2349/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2350/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2351/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2352/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2353/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2354/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2355/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2356/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2357/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2358/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2359/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2360/500000]
+ optim/total_grad_norm=2.908
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2361/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2362/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2363/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2364/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2365/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2366/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2367/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2368/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2369/500000]
+ train/ActionNoiseL2Loss=0.1539
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2370/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2371/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2372/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2373/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2374/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2375/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2376/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2377/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2378/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2379/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2380/500000]
+ optim/total_grad_norm=2.053
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2381/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2382/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2383/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2384/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2385/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2386/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2387/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2388/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2389/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2390/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2391/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2392/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2393/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2394/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2395/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2396/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2397/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2398/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2399/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2400/500000]
+ optim/total_grad_norm=2.381
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2401/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2402/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2403/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2404/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2405/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2406/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2407/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2408/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2409/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2410/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2411/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2412/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2413/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2414/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2415/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2416/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2417/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2418/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2419/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2420/500000]
+ optim/total_grad_norm=2.468
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2421/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2422/500000]
+ train/ActionNoiseL2Loss=0.1386
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2423/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2424/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2425/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2426/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2427/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2428/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2429/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2430/500000]
+ train/ActionNoiseL2Loss=0.1761
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2431/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2432/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2433/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2434/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2435/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2436/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2437/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2438/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2439/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2440/500000]
+ optim/total_grad_norm=2.260
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2441/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2442/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2443/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2444/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2445/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2446/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2447/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2448/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2449/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2450/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2451/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2452/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2453/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2454/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2455/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2456/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2457/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2458/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2459/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2460/500000]
+ optim/total_grad_norm=1.943
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2461/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2462/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2463/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2464/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2465/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2466/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2467/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2468/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2469/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2470/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2471/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2472/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2473/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2474/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2475/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2476/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2477/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2478/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2479/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2480/500000]
+ optim/total_grad_norm=1.812
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2481/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2482/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2483/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2484/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2485/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2486/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2487/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2488/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2489/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2490/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2491/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2492/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2493/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2494/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2495/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2496/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2497/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2498/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2499/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2500/500000]
+ optim/total_grad_norm=1.770
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/24 [23:25:15] INFO | >> Saving config... checkpoint.py:608
+09/24 [23:25:51] INFO | >> Saving model state... checkpoint.py:796
+09/24 [23:26:51] INFO | >> Saving optim state... checkpoint.py:811
+09/24 [23:26:56] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=2502/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2503/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2504/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2505/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=2506/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=2507/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2508/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2509/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2510/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2511/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2512/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2513/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2514/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2515/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2516/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2517/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2518/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2519/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2520/500000]
+ optim/total_grad_norm=2.119
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2521/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2522/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2523/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2524/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2525/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2526/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2527/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2528/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2529/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2530/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2531/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2532/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2533/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2534/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2535/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2536/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2537/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2538/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2539/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2540/500000]
+ optim/total_grad_norm=2.394
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2541/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2542/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2543/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2544/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2545/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2546/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2547/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2548/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2549/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2550/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2551/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2552/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2553/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2554/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2555/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2556/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2557/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2558/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2559/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2560/500000]
+ optim/total_grad_norm=3.090
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2561/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2562/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2563/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2564/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2565/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2566/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2567/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2568/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2569/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2570/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2571/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2572/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2573/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2574/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2575/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2576/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2577/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2578/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2579/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2580/500000]
+ optim/total_grad_norm=1.892
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2581/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2582/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2583/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2584/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2585/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2586/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2587/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2588/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2589/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2590/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2591/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2592/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2593/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2594/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2595/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2596/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2597/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2598/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2599/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2600/500000]
+ optim/total_grad_norm=2.665
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2601/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2602/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2603/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2604/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2605/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2606/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2607/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2608/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2609/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2610/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2611/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2612/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2613/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2614/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2615/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2616/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2617/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2618/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2619/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2620/500000]
+ optim/total_grad_norm=2.145
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2621/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2622/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2623/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2624/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2625/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2626/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2627/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2628/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2629/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2630/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2631/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2632/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2633/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2634/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2635/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2636/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2637/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2638/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2639/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2640/500000]
+ optim/total_grad_norm=1.775
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2641/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2642/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2643/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2644/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2645/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2646/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2647/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2648/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2649/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2650/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2651/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2652/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2653/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2654/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2655/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2656/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2657/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2658/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2659/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2660/500000]
+ optim/total_grad_norm=2.228
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2661/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2662/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2663/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2664/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2665/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2666/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2667/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2668/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2669/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2670/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2671/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2672/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2673/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2674/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2675/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2676/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2677/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2678/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2679/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2680/500000]
+ optim/total_grad_norm=1.907
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2681/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2682/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2683/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2684/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2685/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2686/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2687/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2688/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2689/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2690/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2691/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2692/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2693/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2694/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2695/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2696/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2697/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2698/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2699/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2700/500000]
+ optim/total_grad_norm=1.593
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2701/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2702/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2703/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2704/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2705/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2706/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2707/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2708/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2709/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2710/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=2711/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2712/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2713/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2714/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2715/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2716/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2717/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2718/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2719/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2720/500000]
+ optim/total_grad_norm=2.913
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2721/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2722/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2723/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2724/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2725/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2726/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2727/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2728/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2729/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2730/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2731/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2732/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2733/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2734/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2735/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2736/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2737/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2738/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2739/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2740/500000]
+ optim/total_grad_norm=1.924
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2741/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2742/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2743/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2744/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2745/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2746/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2747/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2748/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2749/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2750/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2751/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2752/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2753/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2754/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2755/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2756/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2757/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2758/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2759/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2760/500000]
+ optim/total_grad_norm=2.694
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2761/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2762/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2763/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2764/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2765/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2766/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2767/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2768/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2769/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2770/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2771/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2772/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2773/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2774/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2775/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2776/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2777/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2778/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2779/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2780/500000]
+ optim/total_grad_norm=1.632
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2781/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2782/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2783/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2784/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2785/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2786/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2787/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2788/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2789/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2790/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2791/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2792/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2793/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2794/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2795/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2796/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2797/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2798/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2799/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2800/500000]
+ optim/total_grad_norm=2.295
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2801/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2802/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=2803/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2804/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2805/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2806/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2807/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2808/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2809/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2810/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2811/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2812/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2813/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2814/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2815/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2816/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2817/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2818/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2819/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2820/500000]
+ optim/total_grad_norm=2.105
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2821/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2822/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2823/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2824/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2825/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2826/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2827/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2828/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2829/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2830/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2831/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2832/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2833/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2834/500000]
+ train/ActionNoiseL2Loss=0.1536
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2835/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2836/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2837/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2838/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2839/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2840/500000]
+ optim/total_grad_norm=1.368
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2841/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2842/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2843/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2844/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2845/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2846/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2847/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2848/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2849/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2850/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2851/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2852/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2853/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2854/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2855/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2856/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2857/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2858/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2859/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2860/500000]
+ optim/total_grad_norm=1.656
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2861/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2862/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2863/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2864/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2865/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2866/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2867/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2868/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2869/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2870/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2871/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2872/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2873/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2874/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2875/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2876/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2877/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2878/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2879/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2880/500000]
+ optim/total_grad_norm=2.356
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2881/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2882/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2883/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2884/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2885/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2886/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2887/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2888/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2889/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2890/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2891/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2892/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2893/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2894/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2895/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2896/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2897/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2898/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2899/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2900/500000]
+ optim/total_grad_norm=1.933
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2901/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2902/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2903/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2904/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2905/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2906/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2907/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2908/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2909/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2910/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=2911/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2912/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2913/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2914/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=2915/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=2916/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2917/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2918/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2919/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=2920/500000]
+ optim/total_grad_norm=1.640
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2921/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2922/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2923/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2924/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2925/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2926/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2927/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2928/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2929/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2930/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2931/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2932/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2933/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2934/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2935/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2936/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2937/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2938/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2939/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2940/500000]
+ optim/total_grad_norm=1.403
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2941/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2942/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2943/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2944/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2945/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2946/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2947/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2948/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2949/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2950/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2951/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2952/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2953/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2954/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2955/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=2956/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2957/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2958/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2959/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2960/500000]
+ optim/total_grad_norm=1.383
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=2961/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2962/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2963/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2964/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2965/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2966/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2967/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2968/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2969/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=2970/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2971/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2972/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2973/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2974/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=2975/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2976/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2977/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2978/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2979/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=2980/500000]
+ optim/total_grad_norm=1.797
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=2981/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2982/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2983/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2984/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2985/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2986/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2987/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2988/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2989/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2990/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=2991/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2992/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2993/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=2994/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2995/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2996/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2997/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2998/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=2999/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3000/500000]
+ optim/total_grad_norm=1.694
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/25 [02:25:32] INFO | >> Saving config... checkpoint.py:608
+09/25 [02:26:03] INFO | >> Saving model state... checkpoint.py:796
+09/25 [02:27:04] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [02:27:09] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3002/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=3003/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=3004/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=3005/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=3006/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=3007/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=3008/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=3009/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=3010/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3011/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3012/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3013/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3014/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3015/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3016/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3017/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3018/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3019/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3020/500000]
+ optim/total_grad_norm=1.834
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3021/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3022/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3023/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3024/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3025/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3026/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3027/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3028/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3029/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3030/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3031/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3032/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3033/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3034/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3035/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3036/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3037/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3038/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3039/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3040/500000]
+ optim/total_grad_norm=1.887
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3041/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3042/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3043/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3044/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3045/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3046/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3047/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3048/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3049/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3050/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3051/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3052/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3053/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3054/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3055/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3056/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3057/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3058/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3059/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3060/500000]
+ optim/total_grad_norm=2.328
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3061/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3062/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3063/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3064/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3065/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3066/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3067/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3068/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3069/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3070/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3071/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3072/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3073/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3074/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3075/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3076/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3077/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3078/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3079/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3080/500000]
+ optim/total_grad_norm=2.384
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3081/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3082/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3083/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3084/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3085/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3086/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3087/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3088/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3089/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3090/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3091/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3092/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3093/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3094/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3095/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3096/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3097/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3098/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3099/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3100/500000]
+ optim/total_grad_norm=1.783
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3101/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3102/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3103/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3104/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3105/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3106/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3107/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3108/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3109/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3110/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3111/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3112/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3113/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3114/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3115/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3116/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3117/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3118/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3119/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3120/500000]
+ optim/total_grad_norm=1.122
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3121/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3122/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3123/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3124/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3125/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3126/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3127/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3128/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3129/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3130/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3131/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3132/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3133/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3134/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3135/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3136/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3137/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3138/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3139/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3140/500000]
+ optim/total_grad_norm=2.090
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3141/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3142/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3143/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3144/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3145/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3146/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3147/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3148/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3149/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3150/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3151/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3152/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3153/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3154/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3155/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3156/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3157/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3158/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3159/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3160/500000]
+ optim/total_grad_norm=1.506
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3161/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3162/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3163/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3164/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3165/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3166/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3167/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3168/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3169/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3170/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3171/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3172/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3173/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3174/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3175/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3176/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3177/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3178/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3179/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3180/500000]
+ optim/total_grad_norm=2.617
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3181/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3182/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3183/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3184/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3185/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3186/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3187/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3188/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3189/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3190/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3191/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3192/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3193/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3194/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3195/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3196/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3197/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3198/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3199/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3200/500000]
+ optim/total_grad_norm=1.830
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3201/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3202/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3203/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3204/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3205/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3206/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3207/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3208/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3209/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3210/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3211/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3212/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3213/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3214/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3215/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3216/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3217/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3218/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3219/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3220/500000]
+ optim/total_grad_norm=1.411
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3221/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3222/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3223/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3224/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3225/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3226/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3227/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3228/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3229/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3230/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3231/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3232/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3233/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3234/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3235/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3236/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3237/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3238/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3239/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3240/500000]
+ optim/total_grad_norm=2.094
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3241/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3242/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3243/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3244/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3245/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3246/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3247/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3248/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3249/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3250/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3251/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3252/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3253/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3254/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3255/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3256/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3257/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3258/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3259/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3260/500000]
+ optim/total_grad_norm=1.679
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3261/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3262/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3263/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3264/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3265/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3266/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3267/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3268/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3269/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3270/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3271/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3272/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3273/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3274/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3275/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3276/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3277/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3278/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3279/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3280/500000]
+ optim/total_grad_norm=2.646
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3281/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3282/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3283/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3284/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3285/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3286/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3287/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3288/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3289/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3290/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3291/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3292/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3293/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3294/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3295/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3296/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3297/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3298/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3299/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3300/500000]
+ optim/total_grad_norm=1.889
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3301/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3302/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3303/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3304/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3305/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3306/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3307/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3308/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3309/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3310/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3311/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3312/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3313/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3314/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3315/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3316/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3317/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3318/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3319/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3320/500000]
+ optim/total_grad_norm=1.302
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3321/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3322/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3323/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3324/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3325/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3326/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3327/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3328/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3329/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3330/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3331/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3332/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3333/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3334/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3335/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3336/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3337/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3338/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3339/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3340/500000]
+ optim/total_grad_norm=1.135
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3341/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3342/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3343/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3344/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3345/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3346/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3347/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3348/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3349/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3350/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3351/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3352/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3353/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3354/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3355/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3356/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3357/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3358/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3359/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3360/500000]
+ optim/total_grad_norm=1.906
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3361/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3362/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3363/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3364/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3365/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3366/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3367/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3368/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3369/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3370/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3371/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3372/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3373/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3374/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3375/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3376/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3377/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3378/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3379/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3380/500000]
+ optim/total_grad_norm=2.072
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3381/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3382/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3383/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3384/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3385/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3386/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3387/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3388/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3389/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3390/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3391/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3392/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3393/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3394/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3395/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3396/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3397/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3398/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3399/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3400/500000]
+ optim/total_grad_norm=1.511
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3401/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3402/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3403/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3404/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3405/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3406/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3407/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3408/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3409/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3410/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3411/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3412/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3413/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3414/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3415/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3416/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3417/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3418/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3419/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3420/500000]
+ optim/total_grad_norm=1.535
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3421/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3422/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3423/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3424/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3425/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3426/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3427/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3428/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3429/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3430/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3431/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3432/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3433/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3434/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3435/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3436/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3437/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3438/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3439/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3440/500000]
+ optim/total_grad_norm=2.180
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3441/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3442/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3443/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3444/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3445/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3446/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3447/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3448/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3449/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3450/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3451/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3452/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3453/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3454/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3455/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3456/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3457/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3458/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3459/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3460/500000]
+ optim/total_grad_norm=2.045
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3461/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3462/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3463/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3464/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3465/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3466/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3467/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3468/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3469/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3470/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3471/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3472/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3473/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3474/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3475/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3476/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3477/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3478/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3479/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3480/500000]
+ optim/total_grad_norm=0.9537
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3481/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3482/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3483/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3484/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3485/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3486/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3487/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3488/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3489/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3490/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3491/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3492/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3493/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3494/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3495/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3496/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3497/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3498/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3499/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3500/500000]
+ optim/total_grad_norm=1.120
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/25 [05:25:37] INFO | >> Saving config... checkpoint.py:608
+09/25 [05:26:17] INFO | >> Saving model state... checkpoint.py:796
+09/25 [05:27:18] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [05:27:23] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=3502/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3503/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,099
+ throughput/device/batches_per_second=0.0458
+[step=3504/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,100
+ throughput/device/batches_per_second=0.0459
+[step=3505/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3506/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3507/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=3508/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3509/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3510/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,437
+[step=3511/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3512/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3513/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3514/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3515/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3516/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3517/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=3518/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=3519/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=3520/500000]
+ optim/total_grad_norm=2.809
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=3521/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3522/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3523/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3524/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3525/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3526/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3527/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3528/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3529/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3530/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3531/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3532/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3533/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3534/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3535/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3536/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3537/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3538/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3539/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3540/500000]
+ optim/total_grad_norm=1.796
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3541/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3542/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3543/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3544/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3545/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3546/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3547/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3548/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3549/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3550/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3551/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3552/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3553/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3554/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3555/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3556/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3557/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3558/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3559/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3560/500000]
+ optim/total_grad_norm=1.525
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3561/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3562/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3563/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3564/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3565/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3566/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3567/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3568/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3569/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3570/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3571/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3572/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3573/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3574/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3575/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3576/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3577/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3578/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3579/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3580/500000]
+ optim/total_grad_norm=1.402
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3581/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3582/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3583/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3584/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3585/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3586/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3587/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3588/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3589/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3590/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3591/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3592/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3593/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3594/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3595/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3596/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3597/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3598/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3599/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3600/500000]
+ optim/total_grad_norm=1.805
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3601/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3602/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3603/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3604/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3605/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3606/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3607/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3608/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3609/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3610/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3611/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3612/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3613/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3614/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3615/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3616/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3617/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3618/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3619/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3620/500000]
+ optim/total_grad_norm=2.152
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3621/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3622/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3623/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3624/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3625/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3626/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3627/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3628/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3629/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3630/500000]
+ train/ActionNoiseL2Loss=0.1943
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3631/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3632/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3633/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3634/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3635/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3636/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3637/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3638/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3639/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3640/500000]
+ optim/total_grad_norm=1.250
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3641/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3642/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3643/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3644/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3645/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3646/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3647/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3648/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3649/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3650/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3651/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3652/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3653/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3654/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3655/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3656/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3657/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3658/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3659/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3660/500000]
+ optim/total_grad_norm=1.222
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3661/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3662/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3663/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3664/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3665/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3666/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3667/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3668/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3669/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3670/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3671/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3672/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3673/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3674/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3675/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3676/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3677/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3678/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3679/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3680/500000]
+ optim/total_grad_norm=1.642
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3681/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3682/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3683/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3684/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3685/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3686/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3687/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3688/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3689/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3690/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3691/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3692/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3693/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3694/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3695/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3696/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3697/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3698/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3699/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3700/500000]
+ optim/total_grad_norm=1.499
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3701/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3702/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3703/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3704/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3705/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3706/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3707/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3708/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3709/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=3710/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3711/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3712/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3713/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3714/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3715/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3716/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3717/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3718/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3719/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3720/500000]
+ optim/total_grad_norm=1.591
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3721/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3722/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3723/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3724/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3725/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3726/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3727/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3728/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3729/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3730/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3731/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3732/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3733/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3734/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3735/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3736/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3737/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3738/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3739/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3740/500000]
+ optim/total_grad_norm=1.354
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3741/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3742/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3743/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3744/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3745/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3746/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3747/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3748/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3749/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3750/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3751/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3752/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3753/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3754/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3755/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3756/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3757/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3758/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3759/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3760/500000]
+ optim/total_grad_norm=0.8051
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3761/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3762/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3763/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3764/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3765/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3766/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3767/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3768/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3769/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3770/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3771/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3772/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3773/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3774/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3775/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3776/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3777/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3778/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3779/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3780/500000]
+ optim/total_grad_norm=1.812
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3781/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3782/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3783/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3784/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3785/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3786/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3787/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3788/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3789/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3790/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3791/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3792/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3793/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3794/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3795/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3796/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3797/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3798/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3799/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3800/500000]
+ optim/total_grad_norm=1.521
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3801/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3802/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3803/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3804/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3805/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3806/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3807/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3808/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3809/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3810/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3811/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3812/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3813/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3814/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3815/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3816/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3817/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3818/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3819/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3820/500000]
+ optim/total_grad_norm=1.887
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3821/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3822/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3823/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3824/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3825/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3826/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3827/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3828/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3829/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3830/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3831/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3832/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3833/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3834/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3835/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3836/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3837/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3838/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3839/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3840/500000]
+ optim/total_grad_norm=1.083
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3841/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3842/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3843/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3844/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3845/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3846/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3847/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3848/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3849/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3850/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3851/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3852/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3853/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3854/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3855/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3856/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3857/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3858/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3859/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3860/500000]
+ optim/total_grad_norm=1.972
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3861/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3862/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3863/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3864/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3865/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3866/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3867/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3868/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3869/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3870/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3871/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3872/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3873/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3874/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3875/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3876/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3877/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3878/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3879/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3880/500000]
+ optim/total_grad_norm=1.493
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3881/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3882/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3883/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3884/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3885/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3886/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3887/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3888/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3889/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3890/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3891/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3892/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3893/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3894/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3895/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3896/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3897/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3898/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3899/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3900/500000]
+ optim/total_grad_norm=1.460
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3901/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3902/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3903/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3904/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3905/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3906/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3907/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3908/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3909/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3910/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3911/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3912/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3913/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3914/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3915/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3916/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3917/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3918/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3919/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=3920/500000]
+ optim/total_grad_norm=1.504
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3921/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3922/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3923/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3924/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3925/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3926/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3927/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3928/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3929/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3930/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3931/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3932/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3933/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3934/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3935/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3936/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=3937/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3938/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3939/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3940/500000]
+ optim/total_grad_norm=1.722
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3941/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3942/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3943/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3944/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3945/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3946/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3947/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3948/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3949/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3950/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3951/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3952/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3953/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3954/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3955/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3956/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3957/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3958/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3959/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3960/500000]
+ optim/total_grad_norm=1.622
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=3961/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3962/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3963/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=3964/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3965/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3966/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=3967/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=3968/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3969/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=3970/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3971/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3972/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3973/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3974/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3975/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3976/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3977/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3978/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3979/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3980/500000]
+ optim/total_grad_norm=2.238
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=3981/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3982/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3983/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=3984/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3985/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=3986/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3987/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=3988/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3989/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3990/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=3991/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3992/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3993/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3994/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3995/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3996/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3997/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3998/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=3999/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4000/500000]
+ optim/total_grad_norm=3.094
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/25 [08:26:01] INFO | >> Saving config... checkpoint.py:608
+09/25 [08:26:37] INFO | >> Saving model state... checkpoint.py:796
+09/25 [08:27:38] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [08:27:43] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=4002/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=4003/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=4004/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=4005/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=4006/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=4007/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=4008/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=4009/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=4010/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+ System/Peak GPU Memory (MB)=44,437
+[step=4011/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=4012/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=4013/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4014/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4015/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4016/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4017/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4018/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4019/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4020/500000]
+ optim/total_grad_norm=1.213
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4021/500000]
+ train/ActionNoiseL2Loss=0.1435
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4022/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4023/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4024/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4025/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4026/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4027/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4028/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4029/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4030/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4031/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4032/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4033/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4034/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4035/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4036/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4037/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4038/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4039/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4040/500000]
+ optim/total_grad_norm=1.986
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4041/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4042/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4043/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4044/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4045/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4046/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4047/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4048/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4049/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4050/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4051/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4052/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4053/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4054/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4055/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4056/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4057/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4058/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4059/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4060/500000]
+ optim/total_grad_norm=1.840
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4061/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4062/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4063/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4064/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4065/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4066/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4067/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4068/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4069/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4070/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4071/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4072/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4073/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4074/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4075/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4076/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4077/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4078/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4079/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4080/500000]
+ optim/total_grad_norm=1.896
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4081/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4082/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4083/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4084/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4085/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4086/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4087/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4088/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4089/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4090/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4091/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4092/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4093/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4094/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4095/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4096/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4097/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4098/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4099/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4100/500000]
+ optim/total_grad_norm=1.292
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4101/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4102/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4103/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4104/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4105/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4106/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4107/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4108/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4109/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4110/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4111/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4112/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4113/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4114/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4115/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4116/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4117/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4118/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4119/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4120/500000]
+ optim/total_grad_norm=2.090
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4121/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4122/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4123/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4124/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4125/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4126/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4127/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4128/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4129/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4130/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4131/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4132/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4133/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4134/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4135/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4136/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4137/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4138/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4139/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4140/500000]
+ optim/total_grad_norm=1.501
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4141/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4142/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4143/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4144/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4145/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4146/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4147/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4148/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4149/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4150/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4151/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4152/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4153/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4154/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4155/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4156/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4157/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4158/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4159/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4160/500000]
+ optim/total_grad_norm=1.343
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4161/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4162/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4163/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4164/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4165/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4166/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4167/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4168/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4169/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4170/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4171/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4172/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4173/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4174/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4175/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4176/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4177/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4178/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4179/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4180/500000]
+ optim/total_grad_norm=1.212
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4181/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4182/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4183/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4184/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4185/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4186/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4187/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4188/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4189/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4190/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4191/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4192/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4193/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4194/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4195/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4196/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4197/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4198/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4199/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4200/500000]
+ optim/total_grad_norm=1.562
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4201/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4202/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4203/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4204/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4205/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4206/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4207/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4208/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4209/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4210/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4211/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4212/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4213/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4214/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4215/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4216/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4217/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4218/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4219/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4220/500000]
+ optim/total_grad_norm=1.110
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4221/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4222/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4223/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4224/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4225/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4226/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4227/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4228/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4229/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4230/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4231/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4232/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4233/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4234/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4235/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4236/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4237/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4238/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4239/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4240/500000]
+ optim/total_grad_norm=2.102
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4241/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4242/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4243/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4244/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4245/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4246/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4247/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4248/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4249/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4250/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4251/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4252/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4253/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4254/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4255/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4256/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4257/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4258/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4259/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4260/500000]
+ optim/total_grad_norm=1.442
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4261/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4262/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4263/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4264/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4265/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4266/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4267/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4268/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4269/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4270/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4271/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4272/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4273/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4274/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4275/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4276/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4277/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4278/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4279/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4280/500000]
+ optim/total_grad_norm=2.056
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4281/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4282/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4283/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4284/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4285/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4286/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4287/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4288/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4289/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4290/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4291/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4292/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4293/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4294/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4295/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4296/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4297/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4298/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4299/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4300/500000]
+ optim/total_grad_norm=1.394
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4301/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4302/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4303/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4304/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4305/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4306/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4307/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4308/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4309/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4310/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4311/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4312/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4313/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4314/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4315/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4316/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4317/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4318/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4319/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4320/500000]
+ optim/total_grad_norm=1.390
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4321/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4322/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4323/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4324/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4325/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4326/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4327/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4328/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4329/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4330/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4331/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4332/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4333/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4334/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4335/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4336/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4337/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4338/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4339/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4340/500000]
+ optim/total_grad_norm=2.531
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4341/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4342/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4343/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4344/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4345/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4346/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4347/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4348/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4349/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4350/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4351/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4352/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4353/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4354/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4355/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4356/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4357/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4358/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4359/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4360/500000]
+ optim/total_grad_norm=1.302
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4361/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4362/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4363/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4364/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4365/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4366/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4367/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4368/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4369/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4370/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4371/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4372/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4373/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4374/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4375/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4376/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4377/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4378/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4379/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4380/500000]
+ optim/total_grad_norm=1.050
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4381/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4382/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4383/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4384/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4385/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4386/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4387/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4388/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4389/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4390/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4391/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4392/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4393/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4394/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4395/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4396/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4397/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4398/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4399/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4400/500000]
+ optim/total_grad_norm=1.444
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4401/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4402/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4403/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4404/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4405/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4406/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4407/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4408/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4409/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4410/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4411/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4412/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4413/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4414/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4415/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4416/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4417/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4418/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4419/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4420/500000]
+ optim/total_grad_norm=0.9808
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4421/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4422/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4423/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4424/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4425/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4426/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4427/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4428/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4429/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4430/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4431/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4432/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4433/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4434/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4435/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4436/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4437/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4438/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4439/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4440/500000]
+ optim/total_grad_norm=1.762
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4441/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4442/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4443/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4444/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4445/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4446/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4447/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4448/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4449/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4450/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4451/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4452/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4453/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4454/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4455/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4456/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4457/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4458/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4459/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4460/500000]
+ optim/total_grad_norm=1.279
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4461/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4462/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4463/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4464/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4465/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4466/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4467/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4468/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4469/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4470/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4471/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4472/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4473/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4474/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4475/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4476/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4477/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4478/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4479/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4480/500000]
+ optim/total_grad_norm=1.442
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4481/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4482/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4483/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4484/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4485/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4486/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4487/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4488/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4489/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4490/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4491/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4492/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4493/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4494/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4495/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4496/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4497/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4498/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4499/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4500/500000]
+ optim/total_grad_norm=1.151
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/25 [11:26:18] INFO | >> Saving config... checkpoint.py:608
+09/25 [11:26:57] INFO | >> Saving model state... checkpoint.py:796
+09/25 [11:27:58] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [11:28:03] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=4502/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4503/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=4504/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4505/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4506/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4507/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4508/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4509/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4510/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4511/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4512/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4513/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4514/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4515/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4516/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4517/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4518/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4519/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4520/500000]
+ optim/total_grad_norm=1.436
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4521/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=4522/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4523/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4524/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4525/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4526/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4527/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4528/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4529/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4530/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4531/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4532/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4533/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4534/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4535/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4536/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4537/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4538/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4539/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4540/500000]
+ optim/total_grad_norm=1.362
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4541/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4542/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4543/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4544/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4545/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4546/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4547/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4548/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4549/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4550/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4551/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4552/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4553/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4554/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4555/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4556/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4557/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4558/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4559/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4560/500000]
+ optim/total_grad_norm=1.437
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4561/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4562/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4563/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4564/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4565/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4566/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4567/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4568/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4569/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4570/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4571/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4572/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4573/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4574/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4575/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4576/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4577/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4578/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4579/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4580/500000]
+ optim/total_grad_norm=0.9979
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4581/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4582/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4583/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4584/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4585/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4586/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4587/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4588/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4589/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4590/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4591/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4592/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4593/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4594/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4595/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4596/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4597/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4598/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4599/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4600/500000]
+ optim/total_grad_norm=1.189
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4601/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4602/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4603/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4604/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4605/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4606/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4607/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4608/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4609/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4610/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4611/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4612/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4613/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4614/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4615/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4616/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4617/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4618/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4619/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4620/500000]
+ optim/total_grad_norm=1.266
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4621/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4622/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4623/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4624/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4625/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4626/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4627/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4628/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4629/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4630/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4631/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4632/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4633/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4634/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4635/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4636/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4637/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4638/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4639/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4640/500000]
+ optim/total_grad_norm=1.677
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4641/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4642/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4643/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4644/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4645/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4646/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4647/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4648/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4649/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4650/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4651/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4652/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4653/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4654/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4655/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4656/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4657/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4658/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4659/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4660/500000]
+ optim/total_grad_norm=1.493
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4661/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4662/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4663/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4664/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4665/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4666/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4667/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4668/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4669/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4670/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4671/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4672/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4673/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4674/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4675/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4676/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4677/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4678/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4679/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4680/500000]
+ optim/total_grad_norm=1.659
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4681/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4682/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4683/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4684/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4685/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4686/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4687/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4688/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4689/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4690/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4691/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4692/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4693/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4694/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4695/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4696/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4697/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4698/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4699/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4700/500000]
+ optim/total_grad_norm=1.200
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4701/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4702/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4703/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4704/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4705/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4706/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4707/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4708/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4709/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4710/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4711/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4712/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4713/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4714/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4715/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4716/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4717/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=4718/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4719/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4720/500000]
+ optim/total_grad_norm=2.122
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4721/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4722/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4723/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4724/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4725/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4726/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4727/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4728/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4729/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4730/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4731/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4732/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4733/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4734/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4735/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4736/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4737/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4738/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4739/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4740/500000]
+ optim/total_grad_norm=1.509
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4741/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4742/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4743/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4744/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4745/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4746/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4747/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4748/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4749/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4750/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4751/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4752/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4753/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4754/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4755/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4756/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4757/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4758/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4759/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4760/500000]
+ optim/total_grad_norm=1.672
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4761/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4762/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4763/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4764/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4765/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4766/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4767/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4768/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4769/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4770/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4771/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4772/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4773/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4774/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4775/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4776/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4777/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4778/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4779/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4780/500000]
+ optim/total_grad_norm=1.919
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4781/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4782/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4783/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4784/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4785/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4786/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4787/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4788/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4789/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4790/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4791/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4792/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4793/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4794/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4795/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4796/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4797/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4798/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4799/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4800/500000]
+ optim/total_grad_norm=2.925
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4801/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4802/500000]
+ train/ActionNoiseL2Loss=0.1528
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4803/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4804/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4805/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4806/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4807/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4808/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4809/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4810/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4811/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4812/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4813/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4814/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4815/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4816/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4817/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4818/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4819/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=4820/500000]
+ optim/total_grad_norm=1.122
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4821/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4822/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4823/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4824/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4825/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4826/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4827/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4828/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4829/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4830/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4831/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4832/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4833/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4834/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4835/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4836/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4837/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4838/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4839/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4840/500000]
+ optim/total_grad_norm=0.8777
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4841/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4842/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4843/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4844/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4845/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4846/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4847/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4848/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4849/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4850/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4851/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4852/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4853/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4854/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4855/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4856/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4857/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4858/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4859/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4860/500000]
+ optim/total_grad_norm=3.065
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4861/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4862/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4863/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4864/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4865/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4866/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4867/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4868/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4869/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4870/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4871/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4872/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4873/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4874/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4875/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4876/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4877/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4878/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4879/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4880/500000]
+ optim/total_grad_norm=1.280
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4881/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4882/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4883/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4884/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4885/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4886/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4887/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4888/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4889/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4890/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4891/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4892/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4893/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4894/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4895/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4896/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4897/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4898/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4899/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4900/500000]
+ optim/total_grad_norm=1.635
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4901/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4902/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4903/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4904/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4905/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4906/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4907/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4908/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4909/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4910/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4911/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4912/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4913/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4914/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4915/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4916/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4917/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4918/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4919/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4920/500000]
+ optim/total_grad_norm=1.726
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4921/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4922/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4923/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4924/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4925/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4926/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4927/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4928/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4929/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=4930/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4931/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4932/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4933/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4934/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4935/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4936/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4937/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4938/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4939/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4940/500000]
+ optim/total_grad_norm=1.804
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4941/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4942/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4943/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4944/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4945/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4946/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4947/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4948/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4949/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4950/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4951/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4952/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4953/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4954/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4955/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4956/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4957/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4958/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4959/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4960/500000]
+ optim/total_grad_norm=1.820
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=4961/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4962/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4963/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4964/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4965/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4966/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4967/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4968/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4969/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4970/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4971/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4972/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4973/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4974/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4975/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=955,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4976/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=955,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4977/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=955,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4978/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=955,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4979/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=955,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4980/500000]
+ optim/total_grad_norm=3.203
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=956,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=4981/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=956,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4982/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=956,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4983/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=956,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4984/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=956,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4985/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=957,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4986/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=957,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4987/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=957,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4988/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=957,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4989/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=957,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4990/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=958,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=4991/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=958,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4992/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=958,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4993/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=958,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4994/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=958,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=4995/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=959,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4996/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=959,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4997/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=959,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4998/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=959,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4999/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=959,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5000/500000]
+ optim/total_grad_norm=1.533
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=960,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/25 [14:26:32] INFO | >> Saving config... checkpoint.py:608
+09/25 [14:27:08] INFO | >> Saving model state... checkpoint.py:796
+09/25 [14:28:09] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [14:28:14] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5001/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=960,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=5002/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=960,384,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=5003/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=960,576,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=5004/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=960,768,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=5005/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=960,960,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5006/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=961,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5007/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=961,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5008/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=961,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5009/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=961,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5010/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=961,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5011/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=962,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5012/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=962,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5013/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=962,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5014/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=962,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5015/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=962,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5016/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=963,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5017/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=963,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5018/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=963,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5019/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=963,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5020/500000]
+ optim/total_grad_norm=1.078
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=963,840,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5021/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=964,032,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5022/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=964,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5023/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=964,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5024/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=964,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5025/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=964,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5026/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=964,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5027/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=965,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5028/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=965,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5029/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=965,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5030/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=965,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5031/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=965,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5032/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=966,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5033/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=966,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5034/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=966,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5035/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=966,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5036/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=966,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5037/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=967,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5038/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=967,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5039/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=967,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5040/500000]
+ optim/total_grad_norm=1.537
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=967,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5041/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=967,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5042/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=968,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5043/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=968,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5044/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=968,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5045/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=968,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5046/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=968,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5047/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=969,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5048/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=969,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5049/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=969,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5050/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=969,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5051/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=969,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5052/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=969,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5053/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=970,176,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5054/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=970,368,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5055/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=970,560,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5056/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=970,752,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5057/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=970,944,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5058/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=971,136,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5059/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=971,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5060/500000]
+ optim/total_grad_norm=1.406
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=971,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5061/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=971,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5062/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=971,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5063/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=972,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5064/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=972,288,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5065/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=972,480,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5066/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=972,672,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5067/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=972,864,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5068/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=973,056,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5069/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=973,248,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5070/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=973,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5071/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=973,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5072/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=973,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5073/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=974,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5074/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=974,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5075/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=974,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5076/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=974,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5077/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=974,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5078/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=974,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5079/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=975,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5080/500000]
+ optim/total_grad_norm=1.397
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=975,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5081/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=975,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5082/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=975,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5083/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=975,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5084/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=976,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5085/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=976,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5086/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=976,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5087/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=976,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5088/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=976,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5089/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=977,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5090/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=977,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5091/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=977,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5092/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=977,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5093/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=977,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5094/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=978,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5095/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=978,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5096/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=978,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5097/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=978,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5098/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=978,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5099/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=979,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5100/500000]
+ optim/total_grad_norm=1.348
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=979,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5101/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=979,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5102/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=979,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5103/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=979,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5104/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=979,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5105/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=980,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5106/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=980,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5107/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=980,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5108/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=980,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5109/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=980,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5110/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=981,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5111/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=981,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5112/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=981,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5113/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=981,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5114/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=981,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5115/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=982,080,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5116/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=982,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5117/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=982,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5118/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=982,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5119/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=982,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5120/500000]
+ optim/total_grad_norm=0.9379
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=983,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5121/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=983,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5122/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=983,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5123/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=983,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5124/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=983,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5125/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=984,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5126/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=984,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5127/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=984,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5128/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=984,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5129/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=984,768,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5130/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=984,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5131/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=985,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5132/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=985,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5133/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=985,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5134/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=985,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5135/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=985,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5136/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=986,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5137/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=986,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5138/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=986,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5139/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=986,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5140/500000]
+ optim/total_grad_norm=1.263
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=986,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5141/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=987,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5142/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=987,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5143/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=987,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5144/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=987,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5145/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=987,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5146/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=988,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5147/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=988,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5148/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=988,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5149/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=988,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5150/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=988,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5151/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=988,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5152/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=989,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5153/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=989,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5154/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=989,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5155/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=989,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5156/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=989,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5157/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=990,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5158/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=990,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5159/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=990,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5160/500000]
+ optim/total_grad_norm=1.498
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=990,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5161/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=990,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5162/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=991,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5163/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=991,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5164/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=991,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5165/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=991,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5166/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=991,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5167/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=992,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5168/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=992,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5169/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=992,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5170/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=992,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5171/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=992,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5172/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=993,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5173/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=993,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5174/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=993,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5175/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=993,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5176/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=993,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5177/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=993,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5178/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=994,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5179/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=994,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5180/500000]
+ optim/total_grad_norm=1.471
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=994,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5181/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=994,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5182/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=994,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5183/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=995,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5184/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=995,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5185/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=995,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5186/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=995,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5187/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=995,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5188/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=996,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5189/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=996,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5190/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=996,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5191/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=996,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5192/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=996,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5193/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=997,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5194/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=997,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5195/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=997,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5196/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=997,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5197/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=997,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5198/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=998,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5199/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=998,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5200/500000]
+ optim/total_grad_norm=1.174
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=998,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5201/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=998,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5202/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=998,784,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5203/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=998,976,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5204/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=999,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5205/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=999,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5206/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=999,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5207/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=999,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5208/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=999,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5209/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,000,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5210/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,000,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5211/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,000,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5212/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,000,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5213/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,000,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5214/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,001,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5215/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,001,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5216/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,001,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5217/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,001,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5218/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,001,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5219/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,002,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5220/500000]
+ optim/total_grad_norm=1.176
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,002,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5221/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,002,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5222/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,002,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5223/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,002,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5224/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,003,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5225/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,003,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5226/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,003,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5227/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,003,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5228/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,003,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5229/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,003,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5230/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,004,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5231/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,004,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5232/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,004,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5233/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,004,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5234/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,004,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5235/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,005,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5236/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,005,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5237/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,005,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5238/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,005,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5239/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,005,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5240/500000]
+ optim/total_grad_norm=1.481
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,006,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5241/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,006,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5242/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,006,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5243/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,006,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5244/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,006,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5245/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,007,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5246/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,007,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5247/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,007,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5248/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,007,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5249/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,007,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5250/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,008,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5251/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,008,192,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5252/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,008,384,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5253/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,008,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5254/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,008,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5255/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,008,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5256/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,009,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5257/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,009,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5258/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,009,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5259/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,009,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5260/500000]
+ optim/total_grad_norm=1.306
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,009,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5261/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,010,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5262/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,010,304,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5263/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,010,496,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5264/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,010,688,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5265/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,010,880,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5266/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,011,072,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5267/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,011,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5268/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,011,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5269/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,011,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5270/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,011,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5271/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,012,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5272/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,012,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5273/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,012,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5274/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,012,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5275/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,012,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5276/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,012,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5277/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=1,013,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5278/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,013,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5279/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,013,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5280/500000]
+ optim/total_grad_norm=1.472
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,013,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5281/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,013,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5282/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,014,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5283/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,014,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5284/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,014,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5285/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,014,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5286/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,014,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5287/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,015,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5288/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,015,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5289/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,015,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5290/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,015,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5291/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,015,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5292/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,016,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5293/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,016,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5294/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,016,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5295/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,016,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5296/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,016,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5297/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,017,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5298/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,017,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5299/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,017,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5300/500000]
+ optim/total_grad_norm=1.150
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,017,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5301/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,017,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5302/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,017,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5303/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,018,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5304/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,018,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5305/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,018,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5306/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,018,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5307/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,018,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5308/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,019,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5309/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,019,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5310/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=1,019,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5311/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,019,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5312/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,019,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5313/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,020,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5314/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,020,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5315/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,020,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5316/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,020,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5317/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,020,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5318/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,021,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5319/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,021,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5320/500000]
+ optim/total_grad_norm=0.9035
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,021,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5321/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,021,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5322/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,021,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5323/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,022,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5324/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,022,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5325/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,022,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5326/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,022,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5327/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,022,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5328/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,022,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5329/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,023,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5330/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,023,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5331/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,023,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5332/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,023,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5333/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,023,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5334/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,024,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5335/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,024,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5336/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,024,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5337/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,024,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5338/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,024,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5339/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,025,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5340/500000]
+ optim/total_grad_norm=1.217
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,025,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5341/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,025,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5342/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,025,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5343/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,025,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5344/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,026,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5345/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,026,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5346/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,026,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5347/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,026,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5348/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,026,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5349/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,027,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5350/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,027,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5351/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,027,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5352/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,027,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5353/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,027,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5354/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,027,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5355/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,028,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5356/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,028,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5357/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,028,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5358/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,028,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5359/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,028,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5360/500000]
+ optim/total_grad_norm=1.516
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,029,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5361/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,029,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5362/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,029,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5363/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,029,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5364/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,029,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5365/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,030,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5366/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,030,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5367/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,030,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5368/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,030,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5369/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,030,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5370/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,031,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5371/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,031,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5372/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,031,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5373/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,031,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5374/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,031,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5375/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,032,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5376/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,032,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5377/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,032,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5378/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,032,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5379/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,032,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5380/500000]
+ optim/total_grad_norm=1.883
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,032,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5381/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,033,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5382/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,033,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5383/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,033,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5384/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,033,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5385/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,033,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5386/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,034,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5387/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,034,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5388/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=1,034,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5389/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,034,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5390/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,034,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5391/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,035,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5392/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,035,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5393/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,035,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5394/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,035,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5395/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,035,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5396/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,036,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5397/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,036,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5398/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,036,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5399/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,036,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5400/500000]
+ optim/total_grad_norm=2.154
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,036,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5401/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,036,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5402/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,037,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5403/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,037,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5404/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,037,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5405/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,037,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5406/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,037,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5407/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=1,038,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5408/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,038,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5409/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,038,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5410/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,038,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5411/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,038,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5412/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,039,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5413/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,039,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5414/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,039,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5415/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,039,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5416/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,039,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5417/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,040,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5418/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,040,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5419/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,040,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5420/500000]
+ optim/total_grad_norm=0.9096
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,040,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5421/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,040,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5422/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,041,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5423/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,041,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5424/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,041,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5425/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,041,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5426/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,041,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5427/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,041,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5428/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,042,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5429/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,042,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5430/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,042,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5431/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,042,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5432/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,042,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5433/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,043,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5434/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,043,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5435/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,043,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5436/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,043,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5437/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,043,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5438/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,044,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5439/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,044,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5440/500000]
+ optim/total_grad_norm=1.539
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,044,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5441/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,044,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5442/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=1,044,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5443/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,045,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5444/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,045,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5445/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,045,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5446/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,045,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5447/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,045,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5448/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,046,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5449/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,046,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5450/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,046,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5451/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,046,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5452/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,046,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5453/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=1,046,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5454/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,047,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5455/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,047,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5456/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,047,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5457/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,047,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5458/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,047,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5459/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,048,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5460/500000]
+ optim/total_grad_norm=1.237
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,048,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5461/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,048,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5462/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,048,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5463/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,048,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5464/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,049,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5465/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,049,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5466/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,049,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5467/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,049,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5468/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,049,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5469/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,050,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5470/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,050,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5471/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,050,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5472/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,050,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5473/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,050,816,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5474/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,051,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5475/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,051,200,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5476/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,051,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5477/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,051,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5478/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,051,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5479/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,051,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5480/500000]
+ optim/total_grad_norm=1.479
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,052,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5481/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,052,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5482/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,052,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5483/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,052,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5484/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,052,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5485/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,053,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5486/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,053,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5487/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,053,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5488/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,053,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5489/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,053,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5490/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,054,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5491/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,054,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5492/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,054,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5493/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,054,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5494/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,054,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5495/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,055,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5496/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=1,055,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5497/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,055,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5498/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,055,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5499/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,055,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5500/500000]
+ optim/total_grad_norm=1.152
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,056,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/25 [17:26:49] INFO | >> Saving config... checkpoint.py:608
+09/25 [17:27:20] INFO | >> Saving model state... checkpoint.py:796
+09/25 [17:28:21] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [17:28:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5501/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,056,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=5502/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,056,384,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5503/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,056,576,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=5504/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,056,768,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=5505/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,056,960,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=5506/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,057,152,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=5507/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,057,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=5508/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,057,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5509/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,057,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5510/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,057,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5511/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,058,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5512/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,058,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5513/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,058,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5514/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,058,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5515/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,058,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5516/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,059,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5517/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,059,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5518/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,059,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5519/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,059,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5520/500000]
+ optim/total_grad_norm=1.302
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,059,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5521/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,060,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5522/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,060,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5523/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,060,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5524/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,060,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5525/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,060,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5526/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,060,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5527/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,061,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5528/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,061,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5529/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,061,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5530/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,061,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5531/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,061,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5532/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,062,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5533/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,062,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5534/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,062,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5535/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,062,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5536/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,062,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5537/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,063,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5538/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,063,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5539/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,063,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5540/500000]
+ optim/total_grad_norm=1.352
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,063,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5541/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,063,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5542/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,064,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5543/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,064,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5544/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,064,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5545/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,064,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5546/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,064,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5547/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,065,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5548/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,065,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5549/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,065,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5550/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,065,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5551/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,065,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5552/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,065,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5553/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,066,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5554/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,066,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5555/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=1,066,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5556/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,066,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5557/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,066,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5558/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,067,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5559/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,067,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5560/500000]
+ optim/total_grad_norm=1.779
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,067,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5561/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,067,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5562/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,067,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5563/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,068,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5564/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,068,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5565/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,068,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5566/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,068,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5567/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,068,864,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5568/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,069,056,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5569/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,069,248,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=5570/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,069,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5571/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,069,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5572/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,069,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5573/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,070,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5574/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,070,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5575/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,070,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5576/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,070,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5577/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,070,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5578/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,070,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5579/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,071,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5580/500000]
+ optim/total_grad_norm=1.789
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,071,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5581/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,071,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5582/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,071,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5583/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=1,071,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5584/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,072,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5585/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,072,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5586/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,072,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5587/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,072,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5588/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,072,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5589/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,073,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5590/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,073,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5591/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,073,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5592/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,073,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5593/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,073,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5594/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,074,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5595/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,074,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5596/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,074,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5597/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,074,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5598/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,074,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5599/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,075,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5600/500000]
+ optim/total_grad_norm=1.634
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,075,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5601/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,075,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5602/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,075,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5603/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,075,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5604/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,075,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5605/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,076,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5606/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,076,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5607/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,076,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5608/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,076,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5609/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,076,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5610/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=1,077,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5611/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,077,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5612/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,077,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5613/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,077,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5614/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,077,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5615/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,078,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5616/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,078,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5617/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,078,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5618/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,078,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5619/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,078,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5620/500000]
+ optim/total_grad_norm=1.519
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,079,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5621/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,079,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5622/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,079,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5623/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,079,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5624/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,079,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5625/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,080,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5626/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,080,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5627/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=1,080,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5628/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,080,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5629/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,080,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5630/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,080,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5631/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,081,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5632/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,081,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5633/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,081,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5634/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,081,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5635/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,081,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5636/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,082,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5637/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,082,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5638/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,082,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5639/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,082,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5640/500000]
+ optim/total_grad_norm=1.368
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,082,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5641/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,083,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5642/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,083,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5643/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,083,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5644/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,083,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5645/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,083,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5646/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,084,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5647/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,084,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5648/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,084,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5649/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,084,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5650/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,084,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5651/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,084,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5652/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,085,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5653/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,085,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5654/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,085,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5655/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,085,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5656/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,085,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5657/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,086,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5658/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,086,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5659/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,086,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5660/500000]
+ optim/total_grad_norm=2.626
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,086,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5661/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,086,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5662/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,087,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5663/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,087,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5664/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,087,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5665/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,087,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5666/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,087,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5667/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,088,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5668/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,088,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5669/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,088,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5670/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,088,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5671/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,088,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5672/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,089,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5673/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,089,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5674/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,089,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5675/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,089,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5676/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,089,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5677/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,089,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5678/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,090,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5679/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,090,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5680/500000]
+ optim/total_grad_norm=1.420
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,090,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5681/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,090,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5682/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,090,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5683/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,091,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5684/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,091,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5685/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,091,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5686/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,091,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5687/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,091,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5688/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=1,092,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5689/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,092,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5690/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,092,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5691/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,092,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5692/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,092,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5693/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,093,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5694/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,093,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5695/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,093,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5696/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,093,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5697/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,093,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5698/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,094,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5699/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,094,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5700/500000]
+ optim/total_grad_norm=1.199
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,094,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5701/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,094,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5702/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,094,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5703/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,094,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5704/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,095,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5705/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,095,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5706/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,095,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5707/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,095,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5708/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,095,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5709/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,096,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5710/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,096,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5711/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,096,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5712/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,096,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5713/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,096,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5714/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,097,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5715/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,097,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5716/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,097,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5717/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,097,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5718/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,097,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5719/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,098,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5720/500000]
+ optim/total_grad_norm=1.202
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,098,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5721/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,098,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5722/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,098,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5723/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,098,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5724/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,099,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5725/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,099,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5726/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,099,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5727/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,099,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5728/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,099,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5729/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,099,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5730/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,100,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5731/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,100,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5732/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,100,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5733/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,100,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5734/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,100,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5735/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,101,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5736/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,101,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5737/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,101,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5738/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,101,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5739/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,101,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5740/500000]
+ optim/total_grad_norm=0.8947
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,102,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5741/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,102,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5742/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,102,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5743/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,102,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5744/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,102,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5745/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,103,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5746/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,103,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5747/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,103,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5748/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,103,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5749/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,103,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5750/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,104,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5751/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,104,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5752/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,104,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5753/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,104,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5754/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,104,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5755/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,104,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5756/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,105,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5757/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,105,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5758/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,105,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5759/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,105,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5760/500000]
+ optim/total_grad_norm=1.039
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,105,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5761/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,106,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5762/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,106,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5763/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,106,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5764/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,106,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5765/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,106,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5766/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,107,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5767/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,107,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5768/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,107,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5769/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,107,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5770/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,107,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5771/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,108,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5772/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,108,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5773/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,108,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5774/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,108,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5775/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,108,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5776/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,108,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5777/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,109,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5778/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,109,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5779/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,109,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5780/500000]
+ optim/total_grad_norm=1.728
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,109,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5781/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,109,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5782/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,110,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5783/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,110,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5784/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,110,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5785/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,110,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5786/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,110,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5787/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,111,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5788/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,111,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5789/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,111,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5790/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,111,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5791/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,111,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5792/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,112,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5793/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,112,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5794/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,112,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5795/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,112,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5796/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,112,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5797/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,113,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5798/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,113,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5799/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,113,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5800/500000]
+ optim/total_grad_norm=1.103
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,113,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5801/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,113,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5802/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,113,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5803/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,114,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5804/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,114,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5805/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,114,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5806/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,114,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5807/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,114,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5808/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,115,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5809/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,115,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5810/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,115,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5811/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,115,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5812/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,115,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5813/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,116,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5814/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,116,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5815/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,116,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5816/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,116,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5817/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,116,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5818/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,117,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5819/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,117,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5820/500000]
+ optim/total_grad_norm=0.9334
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,117,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5821/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,117,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5822/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,117,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5823/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,118,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5824/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,118,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5825/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,118,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5826/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,118,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5827/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,118,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5828/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,118,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5829/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,119,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5830/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,119,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5831/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,119,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5832/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,119,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5833/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,119,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5834/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,120,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5835/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,120,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5836/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,120,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5837/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,120,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5838/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,120,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5839/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,121,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5840/500000]
+ optim/total_grad_norm=1.142
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,121,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5841/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,121,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5842/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,121,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5843/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,121,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5844/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,122,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5845/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,122,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5846/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,122,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5847/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,122,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5848/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,122,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5849/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,123,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5850/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,123,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5851/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,123,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5852/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,123,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5853/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,123,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5854/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,123,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5855/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,124,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5856/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,124,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5857/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,124,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5858/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,124,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5859/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,124,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5860/500000]
+ optim/total_grad_norm=1.635
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,125,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5861/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,125,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5862/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,125,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5863/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=1,125,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5864/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,125,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5865/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,126,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5866/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,126,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=5867/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,126,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5868/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,126,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5869/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,126,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5870/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,127,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5871/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,127,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5872/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,127,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5873/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,127,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5874/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,127,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5875/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,128,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5876/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,128,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5877/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,128,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5878/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,128,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5879/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,128,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5880/500000]
+ optim/total_grad_norm=1.647
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,128,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5881/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=1,129,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5882/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,129,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5883/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,129,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5884/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,129,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5885/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,129,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5886/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,130,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5887/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,130,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=5888/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,130,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5889/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,130,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5890/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,130,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5891/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,131,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5892/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,131,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5893/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,131,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5894/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,131,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5895/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,131,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5896/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,132,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5897/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,132,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5898/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,132,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5899/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,132,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5900/500000]
+ optim/total_grad_norm=1.644
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,132,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5901/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,132,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5902/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,133,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5903/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,133,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5904/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=1,133,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5905/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,133,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5906/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,133,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5907/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,134,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5908/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,134,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5909/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,134,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=5910/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,134,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=5911/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,134,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5912/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,135,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5913/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,135,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5914/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,135,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5915/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,135,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5916/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,135,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5917/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,136,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5918/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,136,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5919/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,136,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5920/500000]
+ optim/total_grad_norm=1.765
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,136,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5921/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,136,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5922/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,137,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5923/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,137,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5924/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,137,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5925/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,137,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5926/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,137,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5927/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,137,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5928/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,138,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5929/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,138,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5930/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,138,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5931/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,138,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5932/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,138,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5933/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,139,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5934/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,139,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5935/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,139,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5936/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,139,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5937/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,139,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5938/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,140,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5939/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,140,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5940/500000]
+ optim/total_grad_norm=2.248
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,140,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5941/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,140,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5942/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,140,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5943/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,141,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5944/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,141,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5945/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,141,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5946/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,141,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5947/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=1,141,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5948/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,142,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5949/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,142,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=5950/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,142,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=5951/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,142,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5952/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,142,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=5953/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,142,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5954/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,143,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5955/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,143,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5956/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,143,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5957/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,143,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5958/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,143,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5959/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,144,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5960/500000]
+ optim/total_grad_norm=1.249
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,144,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=5961/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,144,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5962/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,144,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5963/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,144,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5964/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,145,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5965/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,145,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5966/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,145,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5967/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,145,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5968/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,145,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=5969/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,146,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=5970/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,146,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5971/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,146,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5972/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,146,624,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5973/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,146,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5974/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,147,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5975/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,147,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5976/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,147,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5977/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,147,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5978/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,147,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5979/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=1,147,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5980/500000]
+ optim/total_grad_norm=1.535
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,148,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5981/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,148,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5982/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,148,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5983/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,148,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5984/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,148,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5985/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,149,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5986/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,149,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5987/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,149,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5988/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,149,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5989/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,149,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=5990/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,150,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=5991/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,150,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5992/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,150,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5993/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,150,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5994/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,150,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5995/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,151,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5996/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,151,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5997/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,151,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5998/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,151,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=5999/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,151,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6000/500000]
+ optim/total_grad_norm=1.747
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,152,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/25 [20:27:03] INFO | >> Saving config... checkpoint.py:608
+09/25 [20:27:33] INFO | >> Saving model state... checkpoint.py:796
+09/25 [20:28:30] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [20:28:35] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6001/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,152,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=6002/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,152,384,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=6003/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,152,576,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=6004/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,152,768,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=6005/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,152,960,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=6006/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,153,152,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=6007/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,153,344,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=6008/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,153,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=6009/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,153,728,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=6010/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,153,920,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,437
+[step=6011/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,154,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=6012/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,154,304,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=6013/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,154,496,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=6014/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,154,688,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=6015/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,154,880,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=6016/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,155,072,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=6017/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,155,264,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=6018/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,155,456,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6019/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,155,648,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6020/500000]
+ optim/total_grad_norm=0.9536
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,155,840,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=6021/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,156,032,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=6022/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,156,224,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6023/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,156,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6024/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,156,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6025/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,156,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6026/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,156,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6027/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,157,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6028/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,157,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6029/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,157,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6030/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,157,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6031/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,157,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6032/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,158,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6033/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,158,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6034/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,158,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6035/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,158,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6036/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,158,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6037/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,159,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6038/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,159,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6039/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=1,159,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6040/500000]
+ optim/total_grad_norm=0.9872
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,159,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6041/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,159,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6042/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,160,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6043/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,160,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6044/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,160,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6045/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,160,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6046/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,160,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6047/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,161,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6048/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,161,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6049/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,161,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6050/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,161,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6051/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,161,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6052/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,161,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6053/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,162,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6054/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,162,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6055/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,162,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6056/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,162,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6057/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,162,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6058/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,163,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6059/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,163,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6060/500000]
+ optim/total_grad_norm=1.406
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,163,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6061/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,163,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6062/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,163,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6063/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,164,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6064/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,164,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6065/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,164,480,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6066/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,164,672,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6067/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,164,864,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6068/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,165,056,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6069/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,165,248,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6070/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,165,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6071/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,165,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6072/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,165,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6073/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,166,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6074/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,166,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6075/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,166,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6076/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,166,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6077/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,166,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6078/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,166,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6079/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,167,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6080/500000]
+ optim/total_grad_norm=1.624
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,167,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6081/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,167,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6082/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,167,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6083/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,167,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6084/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,168,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6085/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,168,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6086/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,168,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6087/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,168,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6088/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,168,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6089/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,169,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6090/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,169,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6091/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,169,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6092/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,169,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6093/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,169,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6094/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,170,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6095/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,170,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6096/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,170,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6097/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,170,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6098/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,170,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6099/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,171,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6100/500000]
+ optim/total_grad_norm=1.243
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,171,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6101/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,171,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6102/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,171,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6103/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,171,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6104/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,171,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6105/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,172,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6106/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,172,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6107/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,172,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6108/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,172,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6109/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,172,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6110/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,173,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6111/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,173,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6112/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,173,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6113/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,173,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6114/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,173,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6115/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,174,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6116/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,174,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6117/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,174,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6118/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,174,656,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6119/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,174,848,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6120/500000]
+ optim/total_grad_norm=2.010
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,175,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6121/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,175,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6122/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,175,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6123/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,175,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6124/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,175,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6125/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,176,000,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6126/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,176,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6127/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=1,176,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6128/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,176,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6129/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,176,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6130/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,176,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6131/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,177,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6132/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,177,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6133/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,177,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6134/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,177,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6135/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,177,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6136/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,178,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6137/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,178,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6138/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,178,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6139/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,178,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6140/500000]
+ optim/total_grad_norm=1.147
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,178,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6141/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,179,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6142/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,179,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6143/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,179,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6144/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,179,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6145/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=1,179,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6146/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,180,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6147/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,180,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6148/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,180,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6149/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,180,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6150/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,180,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6151/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,180,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6152/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,181,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6153/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,181,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6154/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,181,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6155/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,181,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6156/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,181,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6157/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,182,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6158/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,182,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6159/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,182,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6160/500000]
+ optim/total_grad_norm=2.407
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=1,182,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6161/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,182,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6162/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,183,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6163/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,183,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6164/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,183,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6165/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=1,183,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6166/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,183,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6167/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,184,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6168/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=1,184,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6169/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,184,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6170/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,184,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6171/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,184,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6172/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,185,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6173/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,185,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6174/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,185,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6175/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,185,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6176/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,185,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6177/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,185,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6178/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,186,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6179/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,186,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6180/500000]
+ optim/total_grad_norm=1.749
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=1,186,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6181/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,186,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6182/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,186,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6183/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,187,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6184/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,187,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6185/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,187,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6186/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,187,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6187/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,187,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6188/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,188,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6189/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,188,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6190/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,188,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6191/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,188,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6192/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,188,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6193/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,189,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6194/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=1,189,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6195/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,189,440,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6196/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,189,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6197/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,189,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6198/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=1,190,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6199/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,190,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6200/500000]
+ optim/total_grad_norm=1.411
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,190,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6201/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,190,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6202/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,190,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6203/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,190,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6204/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,191,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6205/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,191,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6206/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,191,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6207/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,191,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6208/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,191,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6209/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,192,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6210/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,192,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6211/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,192,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6212/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,192,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6213/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,192,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6214/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,193,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6215/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,193,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6216/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,193,472,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6217/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=1,193,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6218/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,193,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6219/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,194,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6220/500000]
+ optim/total_grad_norm=1.021
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,194,240,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6221/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,194,432,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6222/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,194,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6223/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,194,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6224/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,195,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6225/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,195,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6226/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=1,195,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6227/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,195,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6228/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,195,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6229/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,195,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6230/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,196,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6231/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,196,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6232/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,196,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6233/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,196,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6234/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,196,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6235/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=1,197,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6236/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,197,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6237/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,197,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6238/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,197,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6239/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,197,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6240/500000]
+ optim/total_grad_norm=1.263
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,198,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6241/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,198,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6242/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,198,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6243/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,198,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6244/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,198,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6245/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,199,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6246/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,199,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6247/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,199,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6248/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,199,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6249/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,199,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6250/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,200,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6251/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,200,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6252/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,200,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6253/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,200,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6254/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,200,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6255/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,200,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6256/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,201,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6257/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,201,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6258/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,201,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6259/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,201,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6260/500000]
+ optim/total_grad_norm=0.9992
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,201,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6261/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,202,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6262/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,202,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6263/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,202,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6264/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,202,688,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6265/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,202,880,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6266/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,203,072,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6267/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,203,264,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6268/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,203,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6269/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,203,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6270/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,203,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6271/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,204,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6272/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,204,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6273/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,204,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6274/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,204,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6275/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,204,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6276/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,204,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6277/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,205,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6278/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,205,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6279/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,205,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6280/500000]
+ optim/total_grad_norm=1.109
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,205,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6281/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,205,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6282/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,206,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6283/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,206,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6284/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,206,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6285/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,206,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6286/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,206,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6287/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,207,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6288/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,207,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6289/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,207,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6290/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,207,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6291/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,207,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6292/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,208,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6293/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,208,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6294/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,208,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6295/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,208,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6296/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,208,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6297/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,209,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6298/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,209,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6299/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,209,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6300/500000]
+ optim/total_grad_norm=1.888
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,209,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6301/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,209,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6302/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,209,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6303/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,210,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6304/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,210,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6305/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,210,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6306/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,210,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6307/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,210,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6308/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,211,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6309/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,211,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6310/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,211,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6311/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,211,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6312/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,211,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6313/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,212,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6314/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,212,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6315/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,212,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6316/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,212,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6317/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,212,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6318/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,213,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6319/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,213,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6320/500000]
+ optim/total_grad_norm=1.753
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,213,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6321/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,213,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6322/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,213,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6323/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,214,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6324/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=1,214,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6325/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,214,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6326/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,214,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6327/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,214,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6328/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,214,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6329/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,215,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6330/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,215,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6331/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,215,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6332/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,215,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6333/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,215,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6334/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,216,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6335/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,216,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6336/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,216,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6337/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,216,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6338/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,216,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6339/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,217,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6340/500000]
+ optim/total_grad_norm=0.8489
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,217,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6341/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,217,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6342/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,217,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6343/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,217,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6344/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,218,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6345/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,218,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6346/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,218,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6347/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,218,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6348/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,218,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6349/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,219,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6350/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,219,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6351/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,219,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6352/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,219,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6353/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,219,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6354/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,219,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6355/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,220,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6356/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,220,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6357/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,220,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6358/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,220,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6359/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,220,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6360/500000]
+ optim/total_grad_norm=3.281
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,221,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6361/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,221,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6362/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,221,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6363/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,221,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6364/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,221,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6365/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,222,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6366/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,222,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6367/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,222,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6368/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,222,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6369/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,222,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6370/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,223,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6371/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,223,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6372/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,223,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6373/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,223,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6374/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,223,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6375/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,224,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6376/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,224,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6377/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,224,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6378/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,224,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6379/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,224,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6380/500000]
+ optim/total_grad_norm=1.486
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,224,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6381/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,225,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6382/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,225,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6383/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,225,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6384/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,225,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6385/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,225,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6386/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,226,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6387/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,226,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6388/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,226,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6389/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,226,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6390/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,226,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6391/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,227,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6392/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,227,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6393/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,227,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6394/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,227,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6395/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,227,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6396/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,228,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6397/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,228,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6398/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,228,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6399/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,228,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6400/500000]
+ optim/total_grad_norm=1.081
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,228,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6401/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,228,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6402/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,229,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6403/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,229,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6404/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,229,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6405/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,229,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6406/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,229,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6407/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,230,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6408/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,230,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6409/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,230,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6410/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,230,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6411/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,230,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6412/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,231,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6413/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,231,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6414/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,231,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6415/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,231,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6416/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,231,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6417/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,232,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6418/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,232,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6419/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,232,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6420/500000]
+ optim/total_grad_norm=0.9529
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,232,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6421/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,232,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6422/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,233,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6423/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,233,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6424/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,233,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6425/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,233,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6426/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,233,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6427/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,233,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6428/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,234,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6429/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,234,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6430/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,234,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6431/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,234,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6432/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,234,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6433/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,235,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6434/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,235,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6435/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,235,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6436/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,235,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6437/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,235,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6438/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,236,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6439/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,236,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6440/500000]
+ optim/total_grad_norm=1.299
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,236,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6441/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,236,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6442/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,236,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6443/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,237,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6444/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,237,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6445/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,237,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6446/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,237,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6447/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,237,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6448/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,238,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6449/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,238,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6450/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,238,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6451/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,238,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6452/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,238,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6453/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,238,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6454/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,239,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6455/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,239,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6456/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,239,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6457/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,239,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6458/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,239,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6459/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,240,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6460/500000]
+ optim/total_grad_norm=2.020
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=1,240,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6461/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,240,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6462/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,240,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6463/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,240,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6464/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,241,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6465/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,241,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6466/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,241,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6467/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,241,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6468/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,241,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6469/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,242,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6470/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,242,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6471/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,242,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6472/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,242,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6473/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,242,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6474/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,243,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6475/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,243,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6476/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,243,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6477/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,243,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6478/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,243,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6479/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,243,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6480/500000]
+ optim/total_grad_norm=0.7953
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,244,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6481/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,244,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6482/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,244,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6483/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,244,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6484/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,244,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6485/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,245,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6486/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,245,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6487/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,245,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6488/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,245,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6489/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,245,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6490/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,246,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6491/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,246,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6492/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,246,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6493/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,246,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6494/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,246,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6495/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,247,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6496/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,247,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6497/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,247,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6498/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,247,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6499/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,247,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6500/500000]
+ optim/total_grad_norm=1.497
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,248,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/25 [23:27:10] INFO | >> Saving config... checkpoint.py:608
+09/25 [23:27:43] INFO | >> Saving model state... checkpoint.py:796
+09/25 [23:28:44] INFO | >> Saving optim state... checkpoint.py:811
+09/25 [23:28:50] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6501/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,248,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=6502/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,248,384,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=6503/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,248,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6504/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,248,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6505/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,248,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6506/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,249,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6507/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,249,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6508/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,249,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6509/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,249,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6510/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,249,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6511/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,250,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6512/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,250,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6513/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,250,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6514/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,250,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6515/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,250,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6516/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,251,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6517/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=1,251,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6518/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,251,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6519/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,251,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6520/500000]
+ optim/total_grad_norm=1.809
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,251,840,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6521/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,252,032,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6522/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,252,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6523/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,252,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6524/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,252,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6525/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,252,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6526/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,252,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6527/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,253,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6528/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,253,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6529/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,253,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6530/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,253,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6531/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,253,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6532/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,254,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6533/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,254,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6534/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,254,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6535/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,254,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6536/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,254,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6537/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,255,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6538/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,255,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6539/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,255,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6540/500000]
+ optim/total_grad_norm=1.260
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,255,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6541/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,255,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6542/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,256,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6543/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,256,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6544/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,256,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6545/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,256,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6546/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,256,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6547/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,257,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6548/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,257,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6549/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,257,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6550/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,257,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6551/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,257,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6552/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,257,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6553/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,258,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6554/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,258,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6555/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,258,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6556/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,258,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6557/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,258,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6558/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,259,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6559/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,259,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6560/500000]
+ optim/total_grad_norm=1.746
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,259,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6561/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,259,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6562/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,259,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6563/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,260,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6564/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,260,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6565/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,260,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6566/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,260,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6567/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,260,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6568/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,261,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6569/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,261,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6570/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,261,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6571/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,261,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6572/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,261,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6573/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,262,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6574/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,262,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6575/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,262,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6576/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,262,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6577/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,262,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6578/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,262,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6579/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,263,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6580/500000]
+ optim/total_grad_norm=1.159
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,263,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6581/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,263,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6582/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,263,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6583/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,263,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6584/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,264,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6585/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,264,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6586/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,264,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6587/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,264,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6588/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,264,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6589/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,265,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6590/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,265,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6591/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,265,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6592/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,265,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6593/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,265,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6594/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,266,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6595/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,266,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6596/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,266,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6597/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,266,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6598/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,266,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6599/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,267,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6600/500000]
+ optim/total_grad_norm=1.413
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,267,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6601/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,267,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6602/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,267,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6603/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,267,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6604/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,267,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6605/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,268,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6606/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,268,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6607/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,268,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6608/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,268,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6609/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,268,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6610/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,269,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6611/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,269,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6612/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,269,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6613/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,269,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6614/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,269,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6615/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,270,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6616/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,270,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6617/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,270,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6618/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,270,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6619/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,270,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6620/500000]
+ optim/total_grad_norm=1.177
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,271,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6621/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,271,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6622/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,271,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6623/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,271,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6624/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,271,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6625/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,272,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6626/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,272,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6627/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,272,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6628/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,272,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6629/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,272,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6630/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,272,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6631/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,273,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6632/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,273,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6633/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,273,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6634/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,273,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6635/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,273,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6636/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,274,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6637/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,274,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6638/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,274,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6639/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,274,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6640/500000]
+ optim/total_grad_norm=1.007
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,274,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6641/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,275,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6642/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,275,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6643/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,275,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6644/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,275,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6645/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,275,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6646/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,276,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6647/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,276,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6648/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,276,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6649/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,276,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6650/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,276,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6651/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,276,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6652/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,277,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6653/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,277,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6654/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,277,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6655/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,277,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6656/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,277,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6657/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,278,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6658/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,278,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6659/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,278,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6660/500000]
+ optim/total_grad_norm=0.8762
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,278,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6661/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,278,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6662/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,279,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6663/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,279,296,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6664/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,279,488,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6665/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,279,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6666/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,279,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6667/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,280,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6668/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,280,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6669/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,280,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6670/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,280,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6671/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,280,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6672/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=1,281,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6673/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,281,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6674/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,281,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6675/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,281,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6676/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,281,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6677/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,281,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6678/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,282,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6679/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,282,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6680/500000]
+ optim/total_grad_norm=1.288
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,282,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6681/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,282,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6682/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,282,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6683/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,283,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6684/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,283,328,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6685/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,283,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6686/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,283,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6687/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,283,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6688/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,284,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6689/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,284,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6690/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,284,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6691/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,284,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6692/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,284,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6693/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,285,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6694/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,285,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6695/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,285,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6696/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,285,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6697/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=1,285,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6698/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=1,286,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6699/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,286,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6700/500000]
+ optim/total_grad_norm=1.277
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,286,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6701/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,286,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6702/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,286,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6703/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,286,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6704/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,287,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6705/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,287,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6706/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,287,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6707/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,287,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6708/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,287,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6709/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,288,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6710/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,288,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6711/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,288,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6712/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,288,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6713/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=1,288,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6714/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,289,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6715/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,289,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6716/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,289,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6717/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,289,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6718/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,289,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6719/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,290,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6720/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,290,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6721/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,290,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6722/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,290,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6723/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,290,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6724/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,291,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6725/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,291,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6726/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,291,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6727/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,291,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6728/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,291,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6729/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,291,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6730/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,292,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6731/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,292,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6732/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,292,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6733/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,292,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6734/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,292,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6735/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,293,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6736/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,293,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6737/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,293,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6738/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,293,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6739/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,293,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6740/500000]
+ optim/total_grad_norm=1.538
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,294,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6741/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,294,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6742/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,294,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6743/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,294,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6744/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,294,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6745/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=1,295,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6746/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,295,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6747/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,295,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6748/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,295,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6749/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,295,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6750/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,296,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6751/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,296,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6752/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,296,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6753/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,296,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6754/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,296,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6755/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,296,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6756/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,297,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6757/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,297,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6758/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,297,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6759/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,297,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6760/500000]
+ optim/total_grad_norm=1.222
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,297,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6761/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=1,298,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6762/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,298,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6763/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,298,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6764/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,298,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6765/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,298,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6766/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,299,072,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6767/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,299,264,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6768/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,299,456,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6769/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,299,648,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6770/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,299,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6771/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,300,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6772/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,300,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6773/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,300,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6774/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,300,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6775/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,300,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6776/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,300,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6777/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,301,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6778/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,301,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6779/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,301,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6780/500000]
+ optim/total_grad_norm=1.695
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,301,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6781/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,301,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6782/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,302,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6783/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,302,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6784/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,302,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6785/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=1,302,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6786/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,302,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6787/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,303,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6788/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,303,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6789/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,303,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6790/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,303,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6791/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,303,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6792/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,304,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6793/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,304,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6794/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,304,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6795/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,304,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6796/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,304,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6797/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,305,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6798/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,305,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=6799/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,305,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6800/500000]
+ optim/total_grad_norm=1.539
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,305,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=6801/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,305,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6802/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,305,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6803/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,306,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6804/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,306,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6805/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,306,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6806/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,306,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6807/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,306,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6808/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,307,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6809/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,307,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6810/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,307,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6811/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,307,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6812/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,307,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6813/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,308,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6814/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,308,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6815/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,308,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6816/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,308,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6817/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,308,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6818/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,309,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6819/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,309,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6820/500000]
+ optim/total_grad_norm=1.341
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,309,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6821/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=1,309,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6822/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,309,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6823/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,310,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6824/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,310,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6825/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,310,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6826/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,310,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6827/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,310,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6828/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,310,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6829/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,311,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6830/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,311,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6831/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=1,311,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6832/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,311,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6833/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,311,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6834/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,312,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6835/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,312,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6836/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,312,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6837/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,312,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6838/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,312,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6839/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,313,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6840/500000]
+ optim/total_grad_norm=1.162
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,313,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6841/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,313,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6842/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,313,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6843/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,313,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6844/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,314,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6845/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,314,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6846/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,314,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6847/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,314,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6848/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,314,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6849/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,315,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6850/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,315,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6851/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,315,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6852/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,315,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6853/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,315,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6854/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,315,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6855/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,316,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6856/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,316,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6857/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,316,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6858/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,316,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6859/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,316,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6860/500000]
+ optim/total_grad_norm=1.713
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,317,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6861/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,317,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6862/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,317,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6863/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,317,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6864/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,317,888,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6865/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,318,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6866/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,318,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6867/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,318,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6868/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,318,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6869/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,318,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6870/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,319,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6871/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,319,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6872/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,319,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6873/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,319,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6874/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,319,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6875/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,320,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6876/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,320,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6877/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,320,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6878/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,320,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6879/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,320,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6880/500000]
+ optim/total_grad_norm=0.9854
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,320,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6881/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,321,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6882/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,321,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6883/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,321,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6884/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,321,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6885/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,321,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6886/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=1,322,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6887/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,322,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6888/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,322,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6889/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,322,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6890/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,322,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6891/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,323,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6892/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,323,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6893/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,323,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6894/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,323,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=6895/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,323,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6896/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,324,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6897/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,324,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6898/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,324,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6899/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,324,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6900/500000]
+ optim/total_grad_norm=1.155
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,324,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6901/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,324,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6902/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,325,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6903/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,325,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6904/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,325,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6905/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,325,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6906/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,325,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6907/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,326,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6908/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,326,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6909/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,326,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6910/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,326,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6911/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,326,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6912/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,327,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6913/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,327,296,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6914/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,327,488,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6915/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,327,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6916/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,327,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6917/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,328,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6918/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,328,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6919/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,328,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=6920/500000]
+ optim/total_grad_norm=1.611
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,328,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6921/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,328,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6922/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,329,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6923/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,329,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6924/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,329,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6925/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,329,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6926/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,329,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6927/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,329,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6928/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,330,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6929/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,330,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6930/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,330,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6931/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,330,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6932/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,330,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6933/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,331,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6934/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,331,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6935/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,331,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6936/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,331,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6937/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,331,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6938/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,332,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6939/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,332,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6940/500000]
+ optim/total_grad_norm=0.6495
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,332,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6941/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,332,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6942/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,332,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6943/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,333,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6944/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,333,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6945/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,333,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6946/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,333,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6947/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,333,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6948/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,334,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6949/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,334,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6950/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,334,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6951/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,334,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6952/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,334,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6953/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,334,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6954/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,335,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6955/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,335,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6956/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,335,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6957/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,335,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6958/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,335,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6959/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,336,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6960/500000]
+ optim/total_grad_norm=1.147
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,336,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6961/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,336,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6962/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,336,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6963/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,336,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6964/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=1,337,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6965/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=1,337,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6966/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,337,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6967/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,337,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6968/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,337,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6969/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,338,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=6970/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=1,338,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6971/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,338,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6972/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,338,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6973/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,338,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=6974/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,339,008,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6975/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,339,200,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6976/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,339,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6977/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,339,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6978/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,339,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6979/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,339,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6980/500000]
+ optim/total_grad_norm=1.266
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,340,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=6981/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,340,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6982/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,340,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6983/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,340,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6984/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,340,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6985/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,341,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6986/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,341,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6987/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,341,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6988/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,341,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6989/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,341,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6990/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,342,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=6991/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,342,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6992/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,342,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6993/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,342,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6994/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=1,342,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6995/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,343,040,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=6996/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,343,232,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=6997/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,343,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6998/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,343,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=6999/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,343,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7000/500000]
+ optim/total_grad_norm=1.085
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,344,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/26 [02:27:31] INFO | >> Saving config... checkpoint.py:608
+09/26 [02:28:02] INFO | >> Saving model state... checkpoint.py:796
+09/26 [02:29:02] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [02:29:07] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7001/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,344,192,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=7002/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,344,384,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7003/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,344,576,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=7004/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,344,768,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=7005/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,344,960,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=7006/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,345,152,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7007/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,345,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7008/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,345,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7009/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,345,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7010/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,345,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7011/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,346,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7012/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,346,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7013/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,346,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7014/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,346,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7015/500000]
+ train/ActionNoiseL2Loss=0.1714
+ throughput/total_tokens=1,346,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7016/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,347,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7017/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,347,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7018/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,347,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7019/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,347,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7020/500000]
+ optim/total_grad_norm=0.7685
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,347,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7021/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,348,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7022/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,348,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7023/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,348,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7024/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,348,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7025/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,348,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7026/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,348,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7027/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,349,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7028/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,349,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7029/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,349,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7030/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,349,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7031/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,349,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7032/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,350,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7033/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,350,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7034/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,350,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7035/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,350,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7036/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,350,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7037/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,351,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7038/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,351,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7039/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,351,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7040/500000]
+ optim/total_grad_norm=1.315
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,351,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7041/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,351,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7042/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,352,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7043/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,352,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7044/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,352,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7045/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,352,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7046/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,352,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7047/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,353,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7048/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,353,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7049/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,353,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7050/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,353,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7051/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,353,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7052/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,353,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=7053/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,354,176,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=7054/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,354,368,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=7055/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,354,560,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=7056/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,354,752,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=7057/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,354,944,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7058/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,355,136,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7059/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,355,328,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7060/500000]
+ optim/total_grad_norm=1.535
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,355,520,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=7061/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,355,712,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=7062/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,355,904,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7063/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,356,096,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7064/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,356,288,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7065/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,356,480,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7066/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,356,672,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7067/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,356,864,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7068/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,357,056,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7069/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,357,248,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7070/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,357,440,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7071/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=1,357,632,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7072/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,357,824,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7073/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,358,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7074/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,358,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7075/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,358,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7076/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,358,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7077/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,358,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7078/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,358,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7079/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=1,359,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7080/500000]
+ optim/total_grad_norm=1.405
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,359,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7081/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=1,359,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7082/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,359,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7083/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,359,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7084/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,360,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7085/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,360,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7086/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,360,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7087/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,360,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7088/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,360,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7089/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,361,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7090/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,361,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7091/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,361,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7092/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,361,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7093/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,361,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7094/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,362,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7095/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,362,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7096/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,362,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7097/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,362,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7098/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,362,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7099/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,363,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7100/500000]
+ optim/total_grad_norm=1.079
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,363,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7101/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,363,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7102/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,363,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7103/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,363,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7104/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,363,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7105/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,364,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7106/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,364,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7107/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,364,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7108/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,364,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7109/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,364,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7110/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,365,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7111/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,365,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7112/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,365,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7113/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,365,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7114/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,365,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7115/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,366,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7116/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,366,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7117/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,366,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7118/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,366,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7119/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,366,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7120/500000]
+ optim/total_grad_norm=1.258
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,367,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7121/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,367,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7122/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,367,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7123/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,367,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7124/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,367,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7125/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,368,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7126/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,368,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7127/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,368,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7128/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,368,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7129/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,368,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7130/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,368,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7131/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,369,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7132/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,369,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7133/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,369,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7134/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,369,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7135/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,369,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7136/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,370,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7137/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,370,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7138/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,370,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7139/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,370,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7140/500000]
+ optim/total_grad_norm=1.218
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,370,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7141/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,371,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7142/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,371,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7143/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,371,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7144/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,371,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7145/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,371,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7146/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,372,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7147/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,372,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7148/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,372,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7149/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,372,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7150/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,372,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7151/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,372,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7152/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,373,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7153/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,373,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7154/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,373,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7155/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,373,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7156/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,373,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7157/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,374,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7158/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,374,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7159/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,374,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7160/500000]
+ optim/total_grad_norm=0.9760
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,374,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7161/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=1,374,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7162/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,375,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7163/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,375,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7164/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,375,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7165/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,375,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7166/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,375,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7167/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,376,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7168/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,376,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7169/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,376,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7170/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,376,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7171/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,376,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7172/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,377,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7173/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,377,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7174/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,377,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7175/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,377,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7176/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,377,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7177/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,377,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7178/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,378,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7179/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,378,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7180/500000]
+ optim/total_grad_norm=0.9063
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,378,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7181/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,378,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7182/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,378,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7183/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,379,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7184/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,379,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7185/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,379,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7186/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=1,379,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7187/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,379,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7188/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,380,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7189/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,380,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7190/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,380,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7191/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,380,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7192/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,380,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7193/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,381,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7194/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,381,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7195/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,381,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7196/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,381,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7197/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,381,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7198/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,382,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7199/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,382,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7200/500000]
+ optim/total_grad_norm=2.183
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=1,382,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7201/500000]
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=1,382,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7202/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,382,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7203/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,382,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7204/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,383,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7205/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,383,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7206/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,383,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7207/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,383,744,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7208/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,383,936,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7209/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,384,128,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7210/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,384,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7211/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,384,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7212/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,384,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7213/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,384,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7214/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,385,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7215/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,385,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7216/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,385,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7217/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,385,664,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7218/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,385,856,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7219/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,386,048,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7220/500000]
+ optim/total_grad_norm=1.180
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,386,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7221/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,386,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7222/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,386,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7223/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,386,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7224/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,387,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7225/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,387,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7226/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,387,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7227/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,387,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7228/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,387,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7229/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,387,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7230/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,388,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7231/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,388,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7232/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,388,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7233/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,388,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7234/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,388,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7235/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,389,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7236/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,389,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7237/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,389,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7238/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,389,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7239/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,389,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7240/500000]
+ optim/total_grad_norm=1.391
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,390,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7241/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,390,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7242/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,390,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7243/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,390,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7244/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,390,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7245/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,391,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7246/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,391,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7247/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,391,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7248/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,391,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7249/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,391,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7250/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,392,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7251/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,392,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7252/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,392,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7253/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,392,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7254/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,392,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7255/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,392,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7256/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,393,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7257/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,393,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7258/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,393,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7259/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,393,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7260/500000]
+ optim/total_grad_norm=2.053
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,393,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7261/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,394,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7262/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,394,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7263/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,394,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7264/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,394,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7265/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,394,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7266/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,395,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7267/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,395,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7268/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,395,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7269/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,395,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7270/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,395,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7271/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,396,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7272/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,396,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7273/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,396,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7274/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,396,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7275/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,396,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7276/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,396,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7277/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,397,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7278/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,397,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7279/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,397,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7280/500000]
+ optim/total_grad_norm=1.119
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,397,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7281/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,397,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7282/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,398,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7283/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,398,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7284/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,398,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7285/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,398,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7286/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,398,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7287/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,399,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7288/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,399,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7289/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,399,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7290/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,399,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7291/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,399,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7292/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=1,400,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7293/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,400,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7294/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,400,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7295/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,400,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7296/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,400,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7297/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,401,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7298/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,401,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7299/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,401,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7300/500000]
+ optim/total_grad_norm=1.186
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,401,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7301/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,401,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7302/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,401,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7303/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,402,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7304/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,402,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7305/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,402,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7306/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,402,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7307/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,402,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7308/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,403,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7309/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,403,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7310/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,403,520,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7311/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,403,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7312/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,403,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7313/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=1,404,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7314/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,404,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7315/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,404,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7316/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,404,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7317/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,404,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7318/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,405,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7319/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,405,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7320/500000]
+ optim/total_grad_norm=1.634
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,405,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7321/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,405,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7322/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,405,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7323/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,406,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7324/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,406,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7325/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=1,406,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7326/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,406,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7327/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,406,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7328/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,406,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7329/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,407,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7330/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,407,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7331/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,407,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7332/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,407,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7333/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,407,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7334/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,408,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7335/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,408,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7336/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,408,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7337/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,408,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7338/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,408,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7339/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,409,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7340/500000]
+ optim/total_grad_norm=1.312
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,409,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7341/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,409,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7342/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,409,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7343/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,409,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7344/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,410,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7345/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=1,410,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7346/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,410,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7347/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,410,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7348/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,410,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7349/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,411,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7350/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,411,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7351/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,411,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7352/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,411,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7353/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,411,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7354/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,411,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7355/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,412,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7356/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,412,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7357/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,412,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7358/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,412,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7359/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,412,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7360/500000]
+ optim/total_grad_norm=0.7388
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,413,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7361/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,413,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7362/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,413,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7363/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,413,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7364/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,413,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7365/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,414,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7366/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,414,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7367/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,414,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7368/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,414,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7369/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,414,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7370/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,415,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7371/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,415,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7372/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,415,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7373/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,415,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7374/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,415,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7375/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,416,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7376/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,416,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7377/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,416,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7378/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,416,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7379/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,416,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7380/500000]
+ optim/total_grad_norm=1.317
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,416,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7381/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,417,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7382/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,417,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7383/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,417,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7384/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,417,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7385/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,417,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7386/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,418,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7387/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,418,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7388/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,418,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7389/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,418,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7390/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,418,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7391/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,419,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7392/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,419,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7393/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,419,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7394/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,419,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7395/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,419,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7396/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,420,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7397/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,420,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7398/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,420,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7399/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,420,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7400/500000]
+ optim/total_grad_norm=0.8308
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,420,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7401/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,420,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7402/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,421,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7403/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,421,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7404/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,421,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7405/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,421,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7406/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,421,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7407/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,422,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7408/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,422,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7409/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,422,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7410/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,422,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7411/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,422,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7412/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,423,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7413/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,423,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7414/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,423,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7415/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,423,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7416/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,423,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7417/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,424,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7418/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,424,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7419/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,424,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7420/500000]
+ optim/total_grad_norm=1.114
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,424,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7421/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,424,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7422/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,425,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7423/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,425,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7424/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,425,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7425/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,425,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7426/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,425,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7427/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,425,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7428/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,426,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7429/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,426,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7430/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,426,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7431/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,426,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7432/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,426,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7433/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,427,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7434/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,427,328,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7435/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,427,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7436/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,427,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7437/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,427,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7438/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,428,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7439/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,428,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7440/500000]
+ optim/total_grad_norm=0.7453
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,428,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7441/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,428,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7442/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,428,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7443/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,429,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7444/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,429,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7445/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,429,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7446/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,429,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7447/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,429,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7448/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,430,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7449/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,430,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7450/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,430,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7451/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,430,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7452/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,430,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7453/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,430,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7454/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,431,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7455/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,431,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7456/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,431,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7457/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,431,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7458/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,431,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7459/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,432,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7460/500000]
+ optim/total_grad_norm=1.367
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,432,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7461/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,432,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7462/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,432,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7463/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,432,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7464/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,433,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7465/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,433,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7466/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,433,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7467/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,433,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7468/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,433,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7469/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,434,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7470/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,434,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7471/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,434,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7472/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,434,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7473/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,434,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7474/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,435,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7475/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,435,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7476/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,435,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7477/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,435,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7478/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,435,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7479/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,435,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7480/500000]
+ optim/total_grad_norm=1.448
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,436,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7481/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,436,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7482/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,436,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7483/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,436,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7484/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,436,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7485/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,437,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7486/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,437,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7487/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,437,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7488/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,437,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7489/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,437,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7490/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,438,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7491/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,438,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7492/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,438,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7493/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,438,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7494/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,438,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7495/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,439,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7496/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,439,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7497/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,439,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7498/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,439,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7499/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,439,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7500/500000]
+ optim/total_grad_norm=1.301
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,440,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/26 [05:27:41] INFO | >> Saving config... checkpoint.py:608
+09/26 [05:28:17] INFO | >> Saving model state... checkpoint.py:796
+09/26 [05:29:19] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [05:29:24] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7501/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,440,192,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=7502/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,440,384,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=7503/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,440,576,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=7504/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,440,768,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=7505/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,440,960,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=7506/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,441,152,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=7507/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,441,344,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7508/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,441,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7509/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,441,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7510/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,441,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7511/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,442,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7512/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,442,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7513/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,442,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7514/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,442,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7515/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,442,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7516/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=1,443,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7517/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,443,264,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7518/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,443,456,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7519/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,443,648,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7520/500000]
+ optim/total_grad_norm=1.838
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,443,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7521/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,444,032,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7522/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,444,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7523/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,444,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7524/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,444,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7525/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,444,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7526/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,444,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7527/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,445,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7528/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,445,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7529/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,445,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7530/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,445,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7531/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,445,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7532/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,446,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7533/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,446,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7534/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,446,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7535/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,446,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7536/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,446,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7537/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,447,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7538/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=1,447,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7539/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,447,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7540/500000]
+ optim/total_grad_norm=1.111
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,447,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7541/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,447,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7542/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,448,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7543/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,448,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7544/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,448,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7545/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,448,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7546/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,448,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7547/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,449,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7548/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,449,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7549/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,449,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7550/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,449,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7551/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,449,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7552/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,449,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7553/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,450,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7554/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,450,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7555/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,450,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7556/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,450,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7557/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,450,944,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=7558/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,451,136,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=7559/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,451,328,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=7560/500000]
+ optim/total_grad_norm=1.097
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,451,520,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,437
+[step=7561/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,451,712,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=7562/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,451,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7563/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,452,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=7564/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,452,288,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7565/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,452,480,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7566/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,452,672,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7567/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,452,864,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7568/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,453,056,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7569/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,453,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=7570/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,453,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7571/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,453,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7572/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=1,453,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7573/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,454,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7574/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,454,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7575/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,454,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7576/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,454,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7577/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,454,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7578/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,454,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7579/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,455,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7580/500000]
+ optim/total_grad_norm=1.227
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,455,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7581/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,455,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7582/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,455,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7583/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,455,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7584/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,456,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7585/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,456,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7586/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,456,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7587/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,456,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7588/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,456,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7589/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,457,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7590/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,457,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7591/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,457,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7592/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,457,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7593/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,457,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7594/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,458,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7595/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,458,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7596/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,458,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7597/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,458,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7598/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,458,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7599/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,459,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7600/500000]
+ optim/total_grad_norm=1.164
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,459,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7601/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,459,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7602/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,459,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7603/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,459,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7604/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,459,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7605/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,460,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7606/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,460,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7607/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,460,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7608/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,460,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7609/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,460,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7610/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,461,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7611/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,461,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7612/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,461,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7613/500000]
+ train/ActionNoiseL2Loss=0.0062
+ throughput/total_tokens=1,461,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7614/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,461,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7615/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,462,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7616/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,462,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7617/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,462,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7618/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,462,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7619/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,462,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7620/500000]
+ optim/total_grad_norm=1.807
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,463,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7621/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,463,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7622/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,463,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7623/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,463,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7624/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,463,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7625/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,464,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7626/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,464,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7627/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,464,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7628/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,464,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7629/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,464,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7630/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,464,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7631/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,465,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7632/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,465,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7633/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,465,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7634/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,465,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7635/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,465,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7636/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,466,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7637/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,466,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7638/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,466,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7639/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,466,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7640/500000]
+ optim/total_grad_norm=1.841
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,466,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7641/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,467,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7642/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,467,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7643/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,467,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7644/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,467,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7645/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,467,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7646/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,468,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7647/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,468,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7648/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,468,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7649/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,468,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7650/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,468,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7651/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,468,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7652/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,469,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7653/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,469,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7654/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,469,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7655/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,469,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7656/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,469,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7657/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,470,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7658/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,470,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7659/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,470,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7660/500000]
+ optim/total_grad_norm=0.8087
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,470,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7661/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,470,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7662/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,471,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7663/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,471,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7664/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,471,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7665/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,471,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7666/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,471,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7667/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,472,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7668/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,472,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7669/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,472,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7670/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,472,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7671/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,472,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7672/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,473,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7673/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,473,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7674/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,473,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7675/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,473,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7676/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,473,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7677/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,473,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7678/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,474,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7679/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,474,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7680/500000]
+ optim/total_grad_norm=0.9594
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,474,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7681/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,474,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7682/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,474,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7683/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,475,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7684/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,475,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7685/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,475,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7686/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=1,475,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7687/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,475,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7688/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,476,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7689/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,476,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7690/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,476,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7691/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,476,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7692/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,476,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7693/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,477,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7694/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,477,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7695/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,477,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7696/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,477,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7697/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,477,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7698/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,478,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7699/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,478,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7700/500000]
+ optim/total_grad_norm=2.028
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,478,400,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7701/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,478,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7702/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,478,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7703/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,478,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7704/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,479,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7705/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,479,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7706/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,479,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7707/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,479,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7708/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,479,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7709/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,480,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7710/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,480,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7711/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,480,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7712/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,480,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7713/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,480,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7714/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,481,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7715/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,481,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7716/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,481,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7717/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,481,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7718/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,481,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7719/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,482,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7720/500000]
+ optim/total_grad_norm=0.8829
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,482,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7721/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,482,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7722/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,482,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7723/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,482,816,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7724/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,483,008,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7725/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,483,200,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7726/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,483,392,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7727/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,483,584,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7728/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,483,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7729/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,483,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7730/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,484,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7731/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,484,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7732/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,484,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7733/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,484,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7734/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,484,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7735/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,485,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7736/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,485,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7737/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,485,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7738/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,485,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7739/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,485,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7740/500000]
+ optim/total_grad_norm=1.460
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,486,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7741/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,486,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7742/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,486,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7743/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,486,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7744/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,486,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7745/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,487,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7746/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,487,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7747/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=1,487,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7748/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,487,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7749/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,487,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7750/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,488,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7751/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,488,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7752/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,488,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7753/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,488,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7754/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,488,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7755/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,488,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7756/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,489,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7757/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=1,489,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7758/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,489,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7759/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,489,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7760/500000]
+ optim/total_grad_norm=0.7359
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,489,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7761/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,490,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7762/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,490,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=7763/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,490,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7764/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,490,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7765/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,490,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7766/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,491,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7767/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,491,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7768/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,491,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7769/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,491,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7770/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,491,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7771/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,492,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7772/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,492,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7773/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,492,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7774/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,492,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7775/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,492,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7776/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,492,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7777/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,493,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7778/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,493,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7779/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,493,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7780/500000]
+ optim/total_grad_norm=1.258
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,493,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7781/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,493,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7782/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,494,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7783/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,494,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7784/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,494,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7785/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,494,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7786/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,494,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7787/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=1,495,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7788/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,495,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7789/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=1,495,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7790/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,495,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7791/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,495,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7792/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,496,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7793/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,496,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7794/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,496,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7795/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,496,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7796/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,496,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7797/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,497,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7798/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,497,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7799/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,497,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7800/500000]
+ optim/total_grad_norm=1.350
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,497,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7801/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,497,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7802/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,497,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7803/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,498,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7804/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,498,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7805/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,498,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7806/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,498,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7807/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,498,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7808/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,499,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7809/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,499,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7810/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,499,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7811/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,499,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7812/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,499,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7813/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,500,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7814/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,500,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7815/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,500,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7816/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,500,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7817/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,500,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7818/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,501,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7819/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,501,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7820/500000]
+ optim/total_grad_norm=0.9918
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,501,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7821/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=1,501,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7822/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,501,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7823/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,502,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7824/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,502,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7825/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,502,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7826/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,502,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7827/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,502,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7828/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,502,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7829/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,503,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7830/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,503,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7831/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,503,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7832/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,503,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7833/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,503,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7834/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,504,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7835/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,504,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7836/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,504,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7837/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,504,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7838/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,504,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7839/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,505,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7840/500000]
+ optim/total_grad_norm=0.9042
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,505,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7841/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,505,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7842/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,505,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7843/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,505,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7844/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,506,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7845/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,506,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7846/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,506,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7847/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,506,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7848/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,506,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7849/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,507,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7850/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,507,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7851/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,507,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7852/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,507,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7853/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=1,507,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7854/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,507,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7855/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,508,160,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7856/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,508,352,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7857/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,508,544,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7858/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,508,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=7859/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,508,928,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=7860/500000]
+ optim/total_grad_norm=2.221
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=1,509,120,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=7861/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,509,312,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=7862/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,509,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7863/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,509,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7864/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,509,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7865/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,510,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7866/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,510,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7867/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,510,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7868/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,510,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7869/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,510,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7870/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,511,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7871/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,511,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7872/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,511,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7873/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,511,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7874/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,511,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7875/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,512,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7876/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,512,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7877/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,512,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7878/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,512,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7879/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,512,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7880/500000]
+ optim/total_grad_norm=0.9962
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,512,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7881/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,513,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7882/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,513,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7883/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,513,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7884/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,513,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7885/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,513,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7886/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,514,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7887/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,514,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7888/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,514,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7889/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,514,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7890/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,514,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7891/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,515,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7892/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,515,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7893/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,515,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7894/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,515,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7895/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,515,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7896/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,516,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7897/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,516,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7898/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,516,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7899/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,516,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7900/500000]
+ optim/total_grad_norm=0.9190
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,516,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7901/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,516,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7902/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,517,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7903/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,517,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7904/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,517,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7905/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,517,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7906/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,517,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7907/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,518,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7908/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,518,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7909/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=1,518,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7910/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,518,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=7911/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,518,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7912/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,519,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7913/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,519,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7914/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,519,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7915/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,519,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7916/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,519,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7917/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,520,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7918/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,520,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7919/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,520,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=7920/500000]
+ optim/total_grad_norm=1.646
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,520,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7921/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,520,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7922/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,521,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7923/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,521,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7924/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,521,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7925/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,521,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7926/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,521,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7927/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,521,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7928/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,522,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7929/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,522,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7930/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,522,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7931/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,522,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7932/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,522,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7933/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,523,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7934/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,523,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7935/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,523,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7936/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,523,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7937/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,523,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7938/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,524,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7939/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,524,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7940/500000]
+ optim/total_grad_norm=0.6585
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,524,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7941/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,524,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7942/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,524,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7943/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,525,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7944/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=1,525,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7945/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,525,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7946/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,525,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7947/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,525,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7948/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,526,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7949/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,526,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=7950/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,526,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7951/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,526,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7952/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,526,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7953/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,526,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7954/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,527,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7955/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,527,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7956/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,527,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7957/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,527,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7958/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,527,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7959/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,528,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7960/500000]
+ optim/total_grad_norm=1.227
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,528,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7961/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,528,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7962/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,528,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7963/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,528,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=7964/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,529,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7965/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,529,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7966/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,529,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7967/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,529,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7968/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,529,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7969/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,530,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=7970/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,530,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7971/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,530,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7972/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,530,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7973/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,530,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7974/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,531,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7975/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,531,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7976/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,531,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7977/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,531,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7978/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,531,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7979/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,531,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7980/500000]
+ optim/total_grad_norm=1.122
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,532,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=7981/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,532,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7982/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,532,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7983/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,532,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7984/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,532,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7985/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,533,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7986/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,533,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7987/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,533,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7988/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,533,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7989/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,533,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7990/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,534,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=7991/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,534,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7992/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,534,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=7993/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,534,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7994/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,534,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7995/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,535,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7996/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,535,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7997/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,535,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7998/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,535,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=7999/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,535,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8000/500000]
+ optim/total_grad_norm=1.255
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,536,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/26 [08:27:54] INFO | >> Saving config... checkpoint.py:608
+09/26 [08:28:31] INFO | >> Saving model state... checkpoint.py:796
+09/26 [08:29:32] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [08:29:37] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8001/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,536,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=8002/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,536,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8003/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,536,576,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=8004/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,536,768,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=8005/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,536,960,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=8006/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,537,152,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=8007/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,537,344,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=8008/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,537,536,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=8009/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,537,728,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=8010/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,537,920,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+ System/Peak GPU Memory (MB)=44,437
+[step=8011/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,538,112,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=8012/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,538,304,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=8013/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,538,496,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=8014/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,538,688,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=8015/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,538,880,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=8016/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,539,072,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=8017/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,539,264,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=8018/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,539,456,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8019/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,539,648,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8020/500000]
+ optim/total_grad_norm=1.603
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,539,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8021/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,540,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8022/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,540,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8023/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,540,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8024/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,540,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8025/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,540,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8026/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,540,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8027/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,541,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8028/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,541,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8029/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,541,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8030/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,541,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8031/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,541,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8032/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,542,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8033/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,542,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8034/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,542,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8035/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,542,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8036/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,542,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8037/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,543,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8038/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,543,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8039/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,543,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8040/500000]
+ optim/total_grad_norm=1.187
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,543,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8041/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,543,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8042/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,544,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8043/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,544,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8044/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,544,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8045/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,544,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8046/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,544,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8047/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,545,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8048/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,545,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8049/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,545,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8050/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,545,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8051/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,545,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8052/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,545,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8053/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,546,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8054/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,546,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8055/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,546,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8056/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,546,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8057/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,546,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8058/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,547,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8059/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,547,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8060/500000]
+ optim/total_grad_norm=1.109
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,547,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8061/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,547,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8062/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,547,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8063/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,548,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8064/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,548,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8065/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,548,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8066/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,548,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8067/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,548,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8068/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,549,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8069/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,549,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8070/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,549,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8071/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,549,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8072/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,549,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8073/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,550,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8074/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,550,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8075/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,550,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8076/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,550,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8077/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,550,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8078/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,550,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8079/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,551,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8080/500000]
+ optim/total_grad_norm=1.387
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,551,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8081/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,551,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8082/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=1,551,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8083/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,551,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8084/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,552,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8085/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,552,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8086/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,552,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8087/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,552,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8088/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,552,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8089/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,553,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8090/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,553,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8091/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,553,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8092/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,553,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8093/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,553,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8094/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,554,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8095/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,554,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8096/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,554,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8097/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,554,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8098/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,554,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8099/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,555,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8100/500000]
+ optim/total_grad_norm=0.8058
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,555,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8101/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,555,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8102/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,555,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8103/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,555,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8104/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,555,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8105/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,556,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8106/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,556,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8107/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,556,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8108/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,556,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8109/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,556,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8110/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,557,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8111/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,557,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8112/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,557,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8113/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,557,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8114/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,557,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8115/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,558,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8116/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=1,558,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8117/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,558,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8118/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,558,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8119/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,558,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8120/500000]
+ optim/total_grad_norm=1.048
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,559,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8121/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,559,232,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8122/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,559,424,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8123/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,559,616,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8124/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,559,808,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8125/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,560,000,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8126/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,560,192,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8127/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,560,384,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8128/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,560,576,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8129/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,560,768,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8130/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,560,960,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8131/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,561,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8132/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,561,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8133/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,561,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8134/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,561,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8135/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,561,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8136/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,562,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8137/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,562,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8138/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,562,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8139/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,562,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8140/500000]
+ optim/total_grad_norm=0.9371
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,562,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8141/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,563,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8142/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,563,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8143/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,563,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8144/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,563,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8145/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,563,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8146/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,564,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8147/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,564,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8148/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,564,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8149/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,564,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8150/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,564,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8151/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,564,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8152/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,565,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8153/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,565,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8154/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,565,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8155/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,565,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8156/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,565,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8157/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,566,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8158/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,566,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8159/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,566,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8160/500000]
+ optim/total_grad_norm=1.504
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=1,566,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8161/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,566,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8162/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=1,567,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8163/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,567,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8164/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,567,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8165/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,567,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8166/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,567,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8167/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,568,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8168/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,568,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8169/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,568,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8170/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,568,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8171/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,568,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8172/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,569,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8173/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,569,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8174/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=1,569,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8175/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,569,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8176/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,569,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8177/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,569,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8178/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,570,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8179/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,570,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8180/500000]
+ optim/total_grad_norm=1.639
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,570,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8181/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,570,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8182/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,570,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8183/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,571,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8184/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=1,571,328,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8185/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,571,520,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8186/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,571,712,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8187/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,571,904,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8188/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,572,096,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8189/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,572,288,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8190/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,572,480,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8191/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,572,672,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8192/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,572,864,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8193/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,573,056,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8194/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,573,248,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8195/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,573,440,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8196/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,573,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8197/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,573,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8198/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,574,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8199/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,574,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8200/500000]
+ optim/total_grad_norm=0.8213
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,574,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8201/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,574,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8202/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,574,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8203/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,574,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8204/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,575,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8205/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,575,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8206/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,575,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8207/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,575,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8208/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,575,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8209/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,576,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8210/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,576,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8211/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,576,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8212/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,576,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8213/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,576,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8214/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,577,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8215/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,577,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8216/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,577,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8217/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,577,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8218/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,577,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8219/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,578,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8220/500000]
+ optim/total_grad_norm=1.174
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,578,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8221/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,578,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8222/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,578,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8223/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,578,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8224/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=1,579,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8225/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,579,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8226/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,579,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8227/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,579,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8228/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,579,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8229/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,579,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8230/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,580,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8231/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,580,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8232/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,580,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8233/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,580,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8234/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,580,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8235/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,581,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8236/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,581,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8237/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,581,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8238/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,581,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8239/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,581,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8240/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,582,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8241/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,582,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8242/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,582,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8243/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,582,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8244/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,582,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8245/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,583,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8246/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,583,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8247/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,583,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8248/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,583,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8249/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,583,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8250/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,584,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8251/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,584,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8252/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,584,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8253/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,584,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8254/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,584,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8255/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,584,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8256/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,585,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8257/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,585,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8258/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,585,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8259/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,585,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8260/500000]
+ optim/total_grad_norm=1.068
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,585,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8261/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,586,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8262/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,586,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8263/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,586,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8264/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,586,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8265/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,586,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8266/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,587,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8267/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,587,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8268/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,587,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8269/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,587,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8270/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,587,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8271/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,588,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8272/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,588,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8273/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,588,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8274/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,588,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8275/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,588,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8276/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,588,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8277/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,589,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8278/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,589,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8279/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,589,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8280/500000]
+ optim/total_grad_norm=0.6690
+ train/ActionNoiseL2Loss=0.0093
+ throughput/total_tokens=1,589,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8281/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,589,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8282/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,590,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8283/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,590,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8284/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,590,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8285/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,590,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8286/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,590,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8287/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,591,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8288/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,591,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8289/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,591,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8290/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,591,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8291/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,591,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8292/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,592,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8293/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,592,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8294/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,592,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8295/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,592,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8296/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,592,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8297/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,593,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8298/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,593,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8299/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,593,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8300/500000]
+ optim/total_grad_norm=0.8496
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,593,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8301/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,593,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8302/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,593,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8303/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,594,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8304/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,594,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8305/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,594,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8306/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,594,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8307/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,594,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8308/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,595,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8309/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,595,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8310/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,595,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8311/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,595,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8312/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,595,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8313/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,596,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8314/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,596,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8315/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,596,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8316/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,596,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8317/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,596,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8318/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,597,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8319/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,597,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8320/500000]
+ optim/total_grad_norm=1.124
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,597,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8321/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,597,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8322/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=1,597,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8323/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,598,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8324/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=1,598,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8325/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,598,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8326/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,598,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8327/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,598,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8328/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,598,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8329/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,599,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8330/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,599,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8331/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,599,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8332/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,599,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8333/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,599,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8334/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,600,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8335/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,600,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8336/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,600,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8337/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,600,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8338/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,600,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8339/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,601,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8340/500000]
+ optim/total_grad_norm=0.5717
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,601,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8341/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,601,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8342/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,601,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8343/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,601,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8344/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,602,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8345/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,602,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8346/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,602,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8347/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,602,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8348/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,602,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8349/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,603,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8350/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,603,200,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8351/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,603,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8352/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,603,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8353/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,603,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8354/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,603,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8355/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,604,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8356/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,604,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8357/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,604,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8358/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,604,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8359/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,604,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8360/500000]
+ optim/total_grad_norm=1.552
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,605,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8361/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,605,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8362/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,605,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8363/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,605,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8364/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,605,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8365/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,606,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8366/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,606,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8367/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,606,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8368/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,606,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8369/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,606,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8370/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,607,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8371/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,607,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8372/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,607,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8373/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,607,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8374/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,607,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8375/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,608,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8376/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,608,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8377/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,608,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8378/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,608,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8379/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,608,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8380/500000]
+ optim/total_grad_norm=1.402
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,608,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8381/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,609,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8382/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,609,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8383/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,609,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8384/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,609,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8385/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,609,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8386/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,610,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8387/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,610,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8388/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,610,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8389/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,610,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8390/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=1,610,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8391/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,611,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8392/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,611,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8393/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,611,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8394/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,611,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8395/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,611,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8396/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,612,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8397/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,612,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8398/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,612,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8399/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,612,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8400/500000]
+ optim/total_grad_norm=1.362
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,612,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8401/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,612,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8402/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,613,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8403/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,613,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8404/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,613,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8405/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,613,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8406/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,613,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8407/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,614,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8408/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,614,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8409/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=1,614,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8410/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,614,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8411/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,614,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8412/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,615,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8413/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,615,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8414/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,615,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8415/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,615,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8416/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,615,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8417/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,616,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8418/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,616,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8419/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,616,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8420/500000]
+ optim/total_grad_norm=0.9890
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,616,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8421/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,616,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8422/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,617,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8423/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,617,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8424/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,617,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8425/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,617,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8426/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,617,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8427/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,617,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8428/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,618,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8429/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,618,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8430/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,618,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8431/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,618,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8432/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,618,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8433/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,619,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8434/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,619,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8435/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,619,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8436/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,619,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8437/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,619,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8438/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,620,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8439/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,620,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8440/500000]
+ optim/total_grad_norm=1.452
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,620,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8441/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,620,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8442/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,620,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8443/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,621,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8444/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,621,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8445/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,621,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8446/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,621,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8447/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,621,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8448/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,622,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8449/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,622,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8450/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,622,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8451/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,622,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8452/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,622,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8453/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,622,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8454/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,623,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8455/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,623,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8456/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,623,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8457/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,623,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8458/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,623,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8459/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,624,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8460/500000]
+ optim/total_grad_norm=1.001
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,624,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8461/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,624,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8462/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,624,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8463/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,624,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8464/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,625,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8465/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,625,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8466/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,625,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8467/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,625,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8468/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,625,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8469/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,626,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8470/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,626,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8471/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,626,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8472/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,626,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8473/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,626,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8474/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=1,627,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8475/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,627,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8476/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,627,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8477/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,627,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8478/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,627,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8479/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,627,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8480/500000]
+ optim/total_grad_norm=1.195
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,628,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8481/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,628,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8482/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,628,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8483/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,628,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8484/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,628,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8485/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,629,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8486/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,629,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8487/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,629,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8488/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,629,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8489/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,629,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8490/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,630,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8491/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,630,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8492/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,630,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8493/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,630,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8494/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,630,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8495/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,631,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8496/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,631,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8497/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,631,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8498/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,631,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8499/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,631,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8500/500000]
+ optim/total_grad_norm=1.157
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,632,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/26 [11:28:01] INFO | >> Saving config... checkpoint.py:608
+09/26 [11:28:38] INFO | >> Saving model state... checkpoint.py:796
+09/26 [11:29:39] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [11:29:44] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8501/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,632,192,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=8502/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,632,384,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=8503/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,632,576,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=8504/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,632,768,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8505/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,632,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8506/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,633,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8507/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,633,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8508/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,633,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8509/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,633,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8510/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,633,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8511/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,634,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8512/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,634,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8513/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,634,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8514/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,634,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8515/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,634,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8516/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,635,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8517/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,635,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8518/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,635,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8519/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,635,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8520/500000]
+ optim/total_grad_norm=1.275
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,635,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8521/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,636,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8522/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,636,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8523/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,636,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8524/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,636,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8525/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=1,636,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8526/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,636,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8527/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,637,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8528/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,637,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8529/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,637,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8530/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,637,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8531/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,637,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8532/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,638,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8533/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,638,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8534/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,638,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8535/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,638,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8536/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,638,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8537/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,639,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8538/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,639,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8539/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,639,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8540/500000]
+ optim/total_grad_norm=0.8440
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,639,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8541/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,639,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8542/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,640,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8543/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,640,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8544/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,640,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8545/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,640,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8546/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,640,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8547/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,641,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8548/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,641,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8549/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,641,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8550/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,641,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8551/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,641,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8552/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,641,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8553/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,642,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8554/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,642,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8555/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,642,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8556/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,642,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8557/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,642,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8558/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,643,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8559/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,643,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8560/500000]
+ optim/total_grad_norm=1.163
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,643,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8561/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,643,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8562/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,643,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8563/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,644,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8564/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,644,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8565/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,644,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8566/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,644,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8567/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,644,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8568/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,645,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8569/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,645,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8570/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,645,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8571/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,645,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8572/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,645,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8573/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,646,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8574/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,646,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8575/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,646,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8576/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,646,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8577/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,646,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8578/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,646,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8579/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,647,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8580/500000]
+ optim/total_grad_norm=1.304
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,647,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8581/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,647,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8582/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,647,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8583/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,647,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8584/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,648,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8585/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,648,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8586/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,648,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8587/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,648,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8588/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,648,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8589/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,649,088,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8590/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,649,280,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8591/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,649,472,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8592/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,649,664,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8593/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,649,856,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8594/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,650,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8595/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,650,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8596/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,650,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8597/500000]
+ train/ActionNoiseL2Loss=0.0069
+ throughput/total_tokens=1,650,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8598/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,650,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8599/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,651,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8600/500000]
+ optim/total_grad_norm=2.256
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,651,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8601/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,651,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8602/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,651,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8603/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,651,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8604/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,651,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8605/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,652,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8606/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,652,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8607/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,652,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8608/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,652,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8609/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,652,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8610/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,653,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8611/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,653,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8612/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,653,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8613/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,653,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8614/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,653,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8615/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,654,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8616/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,654,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8617/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,654,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8618/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,654,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8619/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,654,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8620/500000]
+ optim/total_grad_norm=0.7794
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,655,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8621/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,655,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8622/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,655,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8623/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=1,655,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8624/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,655,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8625/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,656,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8626/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,656,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8627/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,656,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8628/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,656,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8629/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,656,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8630/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,656,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8631/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,657,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8632/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,657,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8633/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,657,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8634/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,657,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8635/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,657,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8636/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,658,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8637/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,658,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8638/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,658,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8639/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,658,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8640/500000]
+ optim/total_grad_norm=1.281
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,658,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8641/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=1,659,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8642/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,659,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8643/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,659,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8644/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,659,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8645/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=1,659,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8646/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,660,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8647/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,660,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8648/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,660,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8649/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,660,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8650/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,660,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8651/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,660,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8652/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,661,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8653/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,661,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8654/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,661,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8655/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,661,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8656/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,661,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8657/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,662,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8658/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,662,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8659/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,662,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8660/500000]
+ optim/total_grad_norm=1.380
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,662,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8661/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,662,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8662/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,663,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8663/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,663,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8664/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,663,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8665/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,663,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8666/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,663,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8667/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,664,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8668/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,664,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8669/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,664,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8670/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,664,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8671/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=1,664,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8672/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,665,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8673/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,665,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8674/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,665,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8675/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,665,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8676/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,665,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8677/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,665,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8678/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,666,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8679/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,666,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8680/500000]
+ optim/total_grad_norm=0.8177
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,666,560,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8681/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,666,752,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8682/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,666,944,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8683/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,667,136,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8684/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,667,328,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8685/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,667,520,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8686/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,667,712,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8687/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,667,904,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8688/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,668,096,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8689/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,668,288,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8690/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,668,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8691/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,668,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8692/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,668,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8693/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,669,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8694/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,669,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8695/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,669,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8696/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,669,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8697/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,669,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8698/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,670,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8699/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,670,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8700/500000]
+ optim/total_grad_norm=1.328
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,670,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8701/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,670,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8702/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,670,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8703/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,670,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8704/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,671,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8705/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,671,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8706/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,671,552,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8707/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,671,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8708/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,671,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8709/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,672,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8710/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,672,320,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8711/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,672,512,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8712/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,672,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8713/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,672,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8714/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,673,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8715/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,673,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8716/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,673,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8717/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,673,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8718/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,673,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8719/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=1,674,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8720/500000]
+ optim/total_grad_norm=1.075
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,674,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8721/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,674,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8722/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,674,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8723/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,674,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8724/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,675,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8725/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,675,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8726/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,675,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8727/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,675,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8728/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,675,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8729/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,675,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8730/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,676,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8731/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,676,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8732/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,676,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8733/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,676,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8734/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,676,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8735/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,677,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8736/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,677,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8737/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,677,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8738/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,677,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8739/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,677,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8740/500000]
+ optim/total_grad_norm=1.606
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,678,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8741/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,678,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8742/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,678,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8743/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,678,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8744/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,678,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8745/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,679,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8746/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,679,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8747/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,679,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8748/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,679,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8749/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,679,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8750/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,680,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8751/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,680,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8752/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,680,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8753/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,680,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8754/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,680,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8755/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,680,960,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8756/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,681,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8757/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,681,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8758/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,681,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8759/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,681,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8760/500000]
+ optim/total_grad_norm=0.8095
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,681,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8761/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,682,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8762/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,682,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8763/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=1,682,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8764/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,682,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8765/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,682,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8766/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,683,072,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8767/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,683,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8768/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,683,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8769/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,683,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8770/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,683,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8771/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,684,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8772/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,684,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8773/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,684,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8774/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,684,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8775/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,684,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8776/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,684,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8777/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,685,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8778/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,685,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8779/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,685,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8780/500000]
+ optim/total_grad_norm=1.339
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,685,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8781/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,685,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8782/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,686,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8783/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,686,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8784/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,686,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8785/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,686,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8786/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,686,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8787/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,687,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8788/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,687,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8789/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,687,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8790/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,687,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8791/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,687,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8792/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,688,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8793/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,688,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8794/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,688,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8795/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,688,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8796/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,688,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8797/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,689,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8798/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,689,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8799/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,689,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8800/500000]
+ optim/total_grad_norm=1.123
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,689,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8801/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,689,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8802/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,689,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8803/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,690,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8804/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,690,368,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8805/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,690,560,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8806/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,690,752,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8807/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,690,944,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8808/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,691,136,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8809/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,691,328,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8810/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,691,520,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8811/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,691,712,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8812/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,691,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8813/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,692,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8814/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,692,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8815/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,692,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8816/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,692,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=8817/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,692,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8818/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,693,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8819/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,693,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8820/500000]
+ optim/total_grad_norm=1.151
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,693,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8821/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,693,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8822/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,693,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8823/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,694,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8824/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,694,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8825/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,694,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8826/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,694,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8827/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,694,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8828/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,694,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8829/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,695,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8830/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,695,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8831/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,695,552,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8832/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=1,695,744,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8833/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,695,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8834/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,696,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8835/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,696,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8836/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,696,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8837/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,696,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8838/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,696,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8839/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,697,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8840/500000]
+ optim/total_grad_norm=0.8321
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,697,280,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8841/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,697,472,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8842/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,697,664,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8843/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,697,856,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8844/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,698,048,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8845/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,698,240,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8846/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,698,432,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8847/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,698,624,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8848/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,698,816,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8849/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,699,008,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8850/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,699,200,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8851/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,699,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8852/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,699,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8853/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,699,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8854/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,699,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8855/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,700,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8856/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,700,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8857/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=1,700,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8858/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,700,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8859/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,700,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8860/500000]
+ optim/total_grad_norm=1.049
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,701,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=8861/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,701,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8862/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,701,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8863/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,701,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8864/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,701,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8865/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,702,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8866/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,702,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8867/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,702,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8868/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,702,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8869/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,702,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=8870/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,703,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8871/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,703,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8872/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,703,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8873/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,703,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8874/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=1,703,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8875/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,704,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8876/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,704,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8877/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,704,384,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8878/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=1,704,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8879/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,704,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8880/500000]
+ optim/total_grad_norm=1.094
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,704,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8881/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,705,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8882/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,705,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8883/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,705,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8884/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,705,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8885/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,705,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8886/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,706,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8887/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,706,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8888/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,706,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8889/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,706,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8890/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,706,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8891/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,707,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8892/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,707,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8893/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,707,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8894/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,707,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8895/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,707,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8896/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,708,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8897/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,708,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8898/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,708,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8899/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,708,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8900/500000]
+ optim/total_grad_norm=1.274
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,708,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8901/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,708,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8902/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,709,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8903/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,709,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8904/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,709,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8905/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,709,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8906/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,709,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8907/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,710,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8908/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,710,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8909/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,710,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8910/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,710,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8911/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,710,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8912/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,711,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8913/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,711,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8914/500000]
+ train/ActionNoiseL2Loss=0.0097
+ throughput/total_tokens=1,711,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8915/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,711,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8916/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,711,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8917/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,712,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8918/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,712,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8919/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,712,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8920/500000]
+ optim/total_grad_norm=0.6914
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,712,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8921/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,712,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8922/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,713,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8923/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,713,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8924/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,713,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8925/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,713,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8926/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,713,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8927/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,713,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8928/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,714,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8929/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,714,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8930/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,714,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8931/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,714,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8932/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,714,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8933/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,715,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8934/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,715,328,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8935/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,715,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8936/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,715,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8937/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,715,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8938/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,716,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8939/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,716,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8940/500000]
+ optim/total_grad_norm=0.9612
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=1,716,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8941/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,716,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8942/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,716,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8943/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,717,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8944/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,717,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8945/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,717,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8946/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,717,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8947/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,717,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8948/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,718,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8949/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,718,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8950/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,718,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8951/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,718,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8952/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,718,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8953/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,718,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8954/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,719,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8955/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,719,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8956/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,719,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8957/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,719,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8958/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,719,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8959/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,720,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8960/500000]
+ optim/total_grad_norm=1.199
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,720,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8961/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,720,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8962/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,720,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=8963/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=1,720,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8964/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,721,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=8965/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,721,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8966/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,721,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8967/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,721,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8968/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,721,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8969/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,722,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8970/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,722,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8971/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,722,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8972/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,722,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8973/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,722,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8974/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,723,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8975/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,723,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8976/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,723,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8977/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,723,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8978/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,723,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8979/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,723,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8980/500000]
+ optim/total_grad_norm=1.002
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,724,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=8981/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,724,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8982/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,724,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8983/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,724,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8984/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,724,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8985/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,725,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8986/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,725,312,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8987/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,725,504,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8988/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,725,696,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8989/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,725,888,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8990/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,726,080,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=8991/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,726,272,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8992/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,726,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8993/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,726,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8994/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,726,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8995/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,727,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8996/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,727,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8997/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,727,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8998/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=1,727,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=8999/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,727,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9000/500000]
+ optim/total_grad_norm=1.345
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,728,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/26 [14:28:13] INFO | >> Saving config... checkpoint.py:608
+09/26 [14:28:43] INFO | >> Saving model state... checkpoint.py:796
+09/26 [14:29:45] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [14:29:50] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9001/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,728,192,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=9002/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,728,384,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=9003/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,728,576,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=9004/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,728,768,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=9005/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,728,960,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=9006/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,729,152,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=9007/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,729,344,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9008/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,729,536,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9009/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,729,728,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9010/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,729,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9011/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,730,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9012/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,730,304,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9013/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,730,496,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9014/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,730,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9015/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,730,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9016/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,731,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9017/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,731,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9018/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,731,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9019/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,731,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9020/500000]
+ optim/total_grad_norm=0.8902
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,731,840,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9021/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,732,032,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9022/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,732,224,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9023/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=1,732,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9024/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,732,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9025/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,732,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9026/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,732,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9027/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,733,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9028/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,733,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9029/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,733,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9030/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,733,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9031/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,733,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9032/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,734,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9033/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,734,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9034/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,734,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9035/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,734,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9036/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,734,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9037/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,735,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9038/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,735,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9039/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,735,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9040/500000]
+ optim/total_grad_norm=0.9300
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,735,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9041/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,735,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9042/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,736,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9043/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,736,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9044/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,736,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9045/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,736,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9046/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,736,832,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9047/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=1,737,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9048/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,737,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9049/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,737,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9050/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,737,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9051/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=1,737,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9052/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,737,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9053/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,738,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9054/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,738,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9055/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,738,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9056/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,738,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9057/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,738,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9058/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,739,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9059/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,739,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9060/500000]
+ optim/total_grad_norm=1.322
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,739,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9061/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,739,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9062/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,739,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9063/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,740,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9064/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,740,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9065/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,740,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9066/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,740,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9067/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,740,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9068/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,741,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9069/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,741,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9070/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,741,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9071/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,741,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9072/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,741,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9073/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,742,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9074/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,742,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9075/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,742,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9076/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=1,742,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9077/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,742,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9078/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,742,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9079/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,743,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9080/500000]
+ optim/total_grad_norm=1.108
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,743,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9081/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,743,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9082/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,743,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9083/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,743,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9084/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,744,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9085/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,744,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9086/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,744,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9087/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,744,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9088/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,744,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9089/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,745,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9090/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,745,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9091/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,745,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9092/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,745,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9093/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,745,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9094/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,746,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9095/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,746,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9096/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,746,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9097/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,746,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9098/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,746,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9099/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,747,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9100/500000]
+ optim/total_grad_norm=0.8384
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,747,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9101/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,747,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9102/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,747,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9103/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,747,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9104/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,747,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9105/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,748,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9106/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,748,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9107/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,748,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9108/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,748,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9109/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,748,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9110/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,749,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9111/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,749,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9112/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,749,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9113/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,749,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9114/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,749,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9115/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,750,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9116/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,750,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9117/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,750,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9118/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,750,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9119/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,750,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9120/500000]
+ optim/total_grad_norm=1.304
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,751,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9121/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,751,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9122/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,751,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9123/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,751,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9124/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=1,751,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9125/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,752,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9126/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,752,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9127/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,752,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9128/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,752,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9129/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,752,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9130/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,752,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9131/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,753,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9132/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,753,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9133/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,753,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9134/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,753,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9135/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,753,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9136/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,754,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9137/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,754,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9138/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,754,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9139/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,754,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9140/500000]
+ optim/total_grad_norm=1.519
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,754,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9141/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,755,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9142/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,755,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9143/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,755,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9144/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,755,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9145/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,755,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9146/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,756,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9147/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,756,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9148/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,756,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9149/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,756,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9150/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,756,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9151/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,756,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9152/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,757,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9153/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,757,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9154/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,757,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9155/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,757,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9156/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,757,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9157/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,758,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9158/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,758,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9159/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,758,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9160/500000]
+ optim/total_grad_norm=1.262
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,758,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9161/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,758,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9162/500000]
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=1,759,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9163/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,759,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9164/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,759,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9165/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,759,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9166/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,759,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9167/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,760,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9168/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,760,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9169/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,760,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9170/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,760,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9171/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,760,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9172/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,761,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9173/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,761,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9174/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,761,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9175/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,761,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9176/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,761,792,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9177/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,761,984,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9178/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,762,176,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9179/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,762,368,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9180/500000]
+ optim/total_grad_norm=0.8262
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,762,560,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9181/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,762,752,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9182/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,762,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9183/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,763,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9184/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,763,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9185/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,763,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9186/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,763,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9187/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,763,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9188/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,764,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9189/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,764,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9190/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,764,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9191/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,764,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9192/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,764,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9193/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,765,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9194/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,765,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9195/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,765,440,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9196/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,765,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9197/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,765,824,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9198/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,766,016,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9199/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,766,208,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9200/500000]
+ optim/total_grad_norm=1.754
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,766,400,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9201/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,766,592,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9202/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,766,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9203/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,766,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9204/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,767,168,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9205/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,767,360,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9206/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,767,552,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9207/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,767,744,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9208/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,767,936,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9209/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,768,128,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9210/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,768,320,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9211/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,768,512,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9212/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,768,704,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9213/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,768,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9214/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,769,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9215/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,769,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9216/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,769,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9217/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,769,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9218/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,769,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9219/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,770,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9220/500000]
+ optim/total_grad_norm=0.6514
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,770,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9221/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=1,770,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9222/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,770,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9223/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,770,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9224/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,771,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9225/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,771,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9226/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,771,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9227/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,771,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9228/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,771,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9229/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,771,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9230/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=1,772,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9231/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,772,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9232/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,772,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9233/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,772,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9234/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,772,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9235/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,773,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9236/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,773,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9237/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,773,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9238/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,773,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9239/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,773,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9240/500000]
+ optim/total_grad_norm=1.431
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,774,080,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9241/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,774,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9242/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,774,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9243/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,774,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9244/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,774,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9245/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,775,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9246/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,775,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9247/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,775,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9248/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,775,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9249/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,775,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9250/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,776,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9251/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,776,192,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9252/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,776,384,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9253/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,776,576,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9254/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,776,768,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9255/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,776,960,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9256/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,777,152,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9257/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,777,344,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9258/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,777,536,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9259/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,777,728,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9260/500000]
+ optim/total_grad_norm=1.035
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,777,920,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=9261/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,778,112,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9262/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,778,304,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9263/500000]
+ train/ActionNoiseL2Loss=0.0100
+ throughput/total_tokens=1,778,496,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9264/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,778,688,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9265/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,778,880,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9266/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,779,072,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9267/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,779,264,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9268/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,779,456,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9269/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,779,648,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9270/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,779,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9271/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=1,780,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9272/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,780,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9273/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,780,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9274/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,780,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9275/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,780,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9276/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,780,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9277/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,781,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9278/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,781,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9279/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,781,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9280/500000]
+ optim/total_grad_norm=0.8521
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,781,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9281/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,781,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9282/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,782,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9283/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,782,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9284/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,782,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9285/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,782,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9286/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,782,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9287/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,783,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9288/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,783,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9289/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,783,488,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9290/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,783,680,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9291/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,783,872,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9292/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,784,064,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9293/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,784,256,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9294/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,784,448,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9295/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,784,640,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9296/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,784,832,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9297/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,785,024,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9298/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,785,216,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9299/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,785,408,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9300/500000]
+ optim/total_grad_norm=1.188
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,785,600,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9301/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,785,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9302/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,785,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9303/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,786,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9304/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,786,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9305/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,786,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9306/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,786,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9307/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,786,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9308/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,787,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9309/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,787,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9310/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,787,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9311/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,787,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9312/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,787,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9313/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,788,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9314/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,788,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9315/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,788,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9316/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,788,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9317/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,788,864,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9318/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,789,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9319/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,789,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9320/500000]
+ optim/total_grad_norm=1.231
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,789,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9321/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,789,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9322/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,789,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9323/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,790,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9324/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,790,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9325/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,790,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9326/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,790,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9327/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,790,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9328/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,790,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9329/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,791,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9330/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,791,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9331/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,791,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9332/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,791,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9333/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,791,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9334/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,792,128,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9335/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,792,320,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9336/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,792,512,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9337/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,792,704,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9338/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,792,896,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9339/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,793,088,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9340/500000]
+ optim/total_grad_norm=1.177
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,793,280,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9341/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,793,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9342/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,793,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9343/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,793,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9344/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,794,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9345/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,794,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9346/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,794,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9347/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,794,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9348/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,794,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9349/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,795,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9350/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,795,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9351/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,795,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9352/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,795,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9353/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,795,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9354/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,795,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9355/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,796,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9356/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,796,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9357/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,796,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9358/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,796,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9359/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,796,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9360/500000]
+ optim/total_grad_norm=1.269
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,797,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9361/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,797,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9362/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,797,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9363/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,797,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9364/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,797,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9365/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,798,080,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9366/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,798,272,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9367/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,798,464,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9368/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,798,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9369/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,798,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9370/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,799,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9371/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,799,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9372/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,799,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9373/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,799,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9374/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,799,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9375/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,800,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9376/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,800,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9377/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,800,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9378/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,800,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9379/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,800,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9380/500000]
+ optim/total_grad_norm=0.9659
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,800,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9381/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,801,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9382/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,801,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9383/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,801,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9384/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,801,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9385/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,801,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9386/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,802,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9387/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,802,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9388/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,802,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9389/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,802,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9390/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,802,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9391/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,803,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9392/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,803,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9393/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,803,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9394/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,803,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9395/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,803,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9396/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,804,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9397/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,804,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9398/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,804,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9399/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,804,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9400/500000]
+ optim/total_grad_norm=0.7565
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,804,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9401/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,804,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9402/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,805,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9403/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,805,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9404/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,805,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9405/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,805,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9406/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,805,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9407/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,806,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9408/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,806,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9409/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,806,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9410/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,806,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9411/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,806,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9412/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,807,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9413/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,807,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9414/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,807,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9415/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,807,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9416/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,807,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9417/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,808,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9418/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,808,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9419/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,808,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9420/500000]
+ optim/total_grad_norm=1.089
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,808,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9421/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,808,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9422/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,809,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9423/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,809,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9424/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,809,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9425/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,809,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9426/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,809,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9427/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,809,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9428/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,810,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9429/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,810,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9430/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,810,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9431/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,810,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9432/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=1,810,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9433/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,811,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9434/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,811,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9435/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,811,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9436/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,811,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9437/500000]
+ train/ActionNoiseL2Loss=0.0071
+ throughput/total_tokens=1,811,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9438/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,812,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9439/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,812,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9440/500000]
+ optim/total_grad_norm=1.236
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,812,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9441/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,812,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9442/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,812,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9443/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,813,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9444/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,813,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9445/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,813,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9446/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,813,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9447/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,813,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9448/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,814,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9449/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,814,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9450/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,814,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9451/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,814,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9452/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,814,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9453/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,814,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9454/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,815,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9455/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,815,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9456/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,815,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9457/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,815,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9458/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,815,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9459/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,816,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9460/500000]
+ optim/total_grad_norm=1.261
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,816,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9461/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,816,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9462/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,816,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9463/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,816,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9464/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,817,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9465/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,817,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9466/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,817,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9467/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,817,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9468/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,817,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9469/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,818,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9470/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,818,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9471/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,818,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9472/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,818,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9473/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,818,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9474/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,819,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9475/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,819,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9476/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,819,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9477/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,819,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9478/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,819,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9479/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,819,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9480/500000]
+ optim/total_grad_norm=1.488
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,820,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9481/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,820,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9482/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,820,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9483/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,820,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9484/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,820,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9485/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,821,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9486/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,821,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9487/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,821,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9488/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,821,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9489/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,821,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9490/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,822,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9491/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,822,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9492/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,822,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9493/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,822,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9494/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,822,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9495/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,823,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9496/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,823,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9497/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,823,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9498/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,823,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9499/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,823,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9500/500000]
+ optim/total_grad_norm=0.9528
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,824,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/26 [17:28:22] INFO | >> Saving config... checkpoint.py:608
+09/26 [17:28:53] INFO | >> Saving model state... checkpoint.py:796
+09/26 [17:29:52] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [17:29:57] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9501/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,824,192,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=9502/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,824,384,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=9503/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,824,576,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=9504/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,824,768,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=9505/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,824,960,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=9506/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,825,152,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=9507/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,825,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=9508/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,825,536,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9509/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,825,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9510/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,825,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9511/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,826,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9512/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,826,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9513/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,826,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9514/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,826,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9515/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,826,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9516/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,827,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9517/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,827,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9518/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,827,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9519/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,827,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9520/500000]
+ optim/total_grad_norm=1.443
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,827,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9521/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,828,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9522/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,828,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9523/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,828,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9524/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,828,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9525/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,828,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9526/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,828,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9527/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,829,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9528/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,829,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9529/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,829,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9530/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,829,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9531/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,829,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9532/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,830,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9533/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,830,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9534/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,830,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9535/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,830,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9536/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,830,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9537/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,831,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9538/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,831,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9539/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,831,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9540/500000]
+ optim/total_grad_norm=0.9135
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,831,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9541/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,831,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9542/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,832,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9543/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,832,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9544/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,832,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9545/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,832,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9546/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,832,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9547/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,833,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9548/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,833,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9549/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,833,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9550/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,833,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9551/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,833,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9552/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,833,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9553/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,834,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9554/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,834,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9555/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,834,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9556/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,834,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9557/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,834,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9558/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,835,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9559/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,835,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9560/500000]
+ optim/total_grad_norm=1.181
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,835,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9561/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,835,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9562/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,835,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9563/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,836,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9564/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,836,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9565/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,836,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9566/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,836,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9567/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,836,864,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9568/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,837,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9569/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,837,248,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9570/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,837,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9571/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,837,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9572/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,837,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9573/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,838,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9574/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,838,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9575/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,838,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9576/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,838,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9577/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,838,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9578/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,838,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9579/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,839,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9580/500000]
+ optim/total_grad_norm=0.8807
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,839,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9581/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,839,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9582/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,839,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9583/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,839,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9584/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,840,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9585/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,840,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9586/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,840,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9587/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,840,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9588/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,840,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9589/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,841,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9590/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,841,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9591/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,841,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9592/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,841,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9593/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,841,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9594/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,842,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9595/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,842,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9596/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,842,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9597/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,842,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9598/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,842,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9599/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,843,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9600/500000]
+ optim/total_grad_norm=1.518
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,843,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9601/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,843,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9602/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,843,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9603/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,843,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9604/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,843,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9605/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,844,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9606/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,844,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9607/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,844,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9608/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,844,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9609/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,844,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9610/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,845,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9611/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,845,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9612/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,845,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9613/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,845,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9614/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,845,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9615/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,846,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9616/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,846,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9617/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,846,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9618/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,846,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9619/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,846,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9620/500000]
+ optim/total_grad_norm=0.7166
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,847,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9621/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,847,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9622/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,847,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9623/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,847,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9624/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,847,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9625/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,848,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9626/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,848,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9627/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,848,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9628/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,848,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9629/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,848,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9630/500000]
+ train/ActionNoiseL2Loss=0.0086
+ throughput/total_tokens=1,848,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9631/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,849,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9632/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,849,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9633/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,849,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9634/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,849,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9635/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,849,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9636/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,850,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9637/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,850,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9638/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,850,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9639/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,850,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9640/500000]
+ optim/total_grad_norm=2.071
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,850,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9641/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,851,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9642/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,851,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9643/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,851,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9644/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,851,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9645/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,851,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9646/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,852,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9647/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,852,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9648/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,852,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9649/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,852,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9650/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,852,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9651/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,852,992,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9652/500000]
+ train/ActionNoiseL2Loss=0.0103
+ throughput/total_tokens=1,853,184,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9653/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,853,376,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9654/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,853,568,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9655/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,853,760,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9656/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,853,952,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9657/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,854,144,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9658/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,854,336,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9659/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,854,528,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9660/500000]
+ optim/total_grad_norm=1.278
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,854,720,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9661/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,854,912,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9662/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,855,104,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9663/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,855,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9664/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,855,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9665/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,855,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9666/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,855,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9667/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,856,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9668/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,856,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9669/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,856,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9670/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,856,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9671/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,856,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9672/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,857,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9673/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,857,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9674/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,857,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9675/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,857,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9676/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,857,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9677/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,857,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9678/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,858,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9679/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,858,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9680/500000]
+ optim/total_grad_norm=1.748
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,858,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9681/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,858,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9682/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,858,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9683/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,859,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9684/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,859,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9685/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,859,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9686/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,859,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9687/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,859,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9688/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,860,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9689/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,860,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9690/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,860,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9691/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,860,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9692/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,860,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9693/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,861,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9694/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,861,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9695/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,861,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9696/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,861,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9697/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,861,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9698/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,862,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9699/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,862,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9700/500000]
+ optim/total_grad_norm=1.912
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,862,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9701/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,862,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9702/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,862,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9703/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,862,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9704/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,863,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9705/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,863,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9706/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,863,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9707/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,863,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9708/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,863,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9709/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,864,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9710/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,864,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9711/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,864,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9712/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,864,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9713/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,864,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9714/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,865,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9715/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,865,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9716/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,865,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9717/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,865,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9718/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,865,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9719/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,866,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9720/500000]
+ optim/total_grad_norm=1.250
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,866,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9721/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,866,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9722/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,866,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9723/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,866,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9724/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,867,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9725/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,867,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9726/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,867,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9727/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,867,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9728/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,867,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9729/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,867,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9730/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,868,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9731/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,868,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9732/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,868,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9733/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,868,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9734/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,868,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9735/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,869,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9736/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,869,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9737/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,869,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9738/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,869,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9739/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,869,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9740/500000]
+ optim/total_grad_norm=1.393
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,870,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9741/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,870,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9742/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,870,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9743/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,870,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9744/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,870,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9745/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,871,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9746/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,871,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9747/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,871,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9748/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,871,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9749/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,871,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9750/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,872,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9751/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,872,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9752/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,872,384,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9753/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=1,872,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9754/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,872,768,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9755/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,872,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9756/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,873,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9757/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,873,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9758/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,873,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9759/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,873,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9760/500000]
+ optim/total_grad_norm=0.9805
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,873,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9761/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,874,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9762/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,874,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9763/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,874,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9764/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,874,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9765/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,874,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9766/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,875,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9767/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=1,875,264,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9768/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,875,456,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9769/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,875,648,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9770/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,875,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9771/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,876,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9772/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,876,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9773/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,876,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9774/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,876,608,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9775/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,876,800,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9776/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,876,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9777/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,877,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9778/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,877,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9779/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,877,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9780/500000]
+ optim/total_grad_norm=0.7161
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,877,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9781/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,877,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9782/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,878,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9783/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,878,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9784/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,878,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9785/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,878,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9786/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,878,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9787/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,879,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9788/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,879,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9789/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,879,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9790/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,879,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9791/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,879,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9792/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,880,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9793/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,880,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9794/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,880,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9795/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,880,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9796/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,880,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9797/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,881,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9798/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,881,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9799/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,881,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9800/500000]
+ optim/total_grad_norm=0.8507
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,881,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9801/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,881,792,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9802/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,881,984,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9803/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,882,176,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9804/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,882,368,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9805/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,882,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9806/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,882,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9807/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,882,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9808/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,883,136,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9809/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,883,328,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9810/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,883,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9811/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,883,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9812/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,883,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9813/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,884,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9814/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,884,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9815/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,884,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9816/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,884,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9817/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,884,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9818/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,885,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9819/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,885,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9820/500000]
+ optim/total_grad_norm=1.080
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,885,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9821/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,885,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9822/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=1,885,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9823/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,886,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9824/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,886,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9825/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,886,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9826/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,886,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9827/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,886,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9828/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,886,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9829/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,887,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9830/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,887,360,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9831/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,887,552,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9832/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,887,744,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9833/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,887,936,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9834/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,888,128,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9835/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,888,320,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9836/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,888,512,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9837/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,888,704,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9838/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,888,896,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9839/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,889,088,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9840/500000]
+ optim/total_grad_norm=0.7297
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,889,280,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9841/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,889,472,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9842/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,889,664,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=9843/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,889,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9844/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,890,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9845/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,890,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9846/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,890,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9847/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,890,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9848/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,890,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9849/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,891,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9850/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,891,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9851/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,891,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9852/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,891,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9853/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,891,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9854/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,891,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9855/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,892,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9856/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,892,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9857/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,892,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9858/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,892,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9859/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,892,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9860/500000]
+ optim/total_grad_norm=1.107
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,893,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9861/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,893,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9862/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,893,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9863/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,893,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9864/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,893,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9865/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,894,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9866/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,894,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9867/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,894,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9868/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,894,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9869/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,894,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9870/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,895,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9871/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,895,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9872/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,895,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9873/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,895,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9874/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,895,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9875/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,896,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9876/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,896,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9877/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,896,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9878/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,896,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9879/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,896,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9880/500000]
+ optim/total_grad_norm=1.295
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,896,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=9881/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,897,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9882/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,897,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9883/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,897,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9884/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,897,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9885/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,897,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9886/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,898,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9887/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,898,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9888/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,898,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=9889/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,898,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9890/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,898,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9891/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,899,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9892/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,899,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9893/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,899,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9894/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,899,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9895/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,899,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9896/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,900,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9897/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,900,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9898/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,900,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9899/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,900,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9900/500000]
+ optim/total_grad_norm=0.6573
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,900,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9901/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,900,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9902/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,901,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9903/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,901,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9904/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,901,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9905/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,901,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9906/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,901,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9907/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,902,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9908/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,902,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9909/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=1,902,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9910/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,902,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=9911/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,902,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9912/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=1,903,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9913/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,903,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9914/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,903,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9915/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,903,680,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9916/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,903,872,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9917/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,904,064,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9918/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,904,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9919/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,904,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9920/500000]
+ optim/total_grad_norm=0.4518
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,904,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9921/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,904,832,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9922/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,905,024,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9923/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,905,216,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9924/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,905,408,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9925/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,905,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9926/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,905,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9927/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,905,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9928/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,906,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9929/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,906,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9930/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,906,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9931/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,906,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9932/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,906,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9933/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,907,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9934/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,907,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9935/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,907,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9936/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,907,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9937/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,907,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9938/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,908,096,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9939/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,908,288,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9940/500000]
+ optim/total_grad_norm=1.208
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,908,480,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9941/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,908,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9942/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,908,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9943/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,909,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9944/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,909,248,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9945/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,909,440,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9946/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,909,632,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9947/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,909,824,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9948/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,910,016,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9949/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,910,208,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=9950/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,910,400,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9951/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,910,592,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9952/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,910,784,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9953/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,910,976,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9954/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,911,168,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9955/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,911,360,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=9956/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,911,552,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9957/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,911,744,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9958/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,911,936,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9959/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,912,128,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9960/500000]
+ optim/total_grad_norm=1.211
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,912,320,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=9961/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,912,512,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=9962/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,912,704,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=9963/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,912,896,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9964/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,913,088,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9965/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,913,280,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9966/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,913,472,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9967/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,913,664,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9968/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,913,856,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9969/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,914,048,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=9970/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,914,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9971/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,914,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9972/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,914,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9973/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,914,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9974/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,915,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9975/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,915,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9976/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,915,392,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9977/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,915,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9978/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,915,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9979/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,915,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9980/500000]
+ optim/total_grad_norm=1.076
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,916,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9981/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,916,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9982/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,916,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9983/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,916,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9984/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,916,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=9985/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,917,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9986/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,917,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9987/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=1,917,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9988/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,917,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=9989/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,917,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9990/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,918,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=9991/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,918,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9992/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,918,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9993/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,918,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9994/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,918,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9995/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,919,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9996/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,919,232,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9997/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,919,424,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9998/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,919,616,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=9999/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,919,808,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10000/500000]
+ optim/total_grad_norm=0.5100
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,920,000,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/26 [20:28:28] INFO | >> Saving config... checkpoint.py:608
+09/26 [20:29:02] INFO | >> Saving model state... checkpoint.py:796
+09/26 [20:29:59] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [20:30:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10001/500000]
+ train/ActionNoiseL2Loss=0.0091
+ throughput/total_tokens=1,920,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10002/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,920,384,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=10003/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,920,576,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=10004/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,920,768,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=10005/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,920,960,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10006/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,921,152,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=10007/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,921,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10008/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,921,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10009/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,921,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10010/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,921,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10011/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,922,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10012/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,922,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10013/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,922,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10014/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,922,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10015/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,922,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10016/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,923,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10017/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,923,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10018/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,923,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10019/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,923,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10020/500000]
+ optim/total_grad_norm=1.149
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,923,840,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10021/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,924,032,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10022/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,924,224,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10023/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,924,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10024/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,924,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10025/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,924,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10026/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,924,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10027/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,925,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10028/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,925,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10029/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,925,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10030/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,925,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10031/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,925,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10032/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,926,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10033/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,926,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10034/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,926,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10035/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,926,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10036/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,926,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10037/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,927,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10038/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,927,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10039/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,927,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10040/500000]
+ optim/total_grad_norm=1.183
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,927,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10041/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,927,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10042/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,928,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10043/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,928,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10044/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,928,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10045/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,928,640,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10046/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,928,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10047/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,929,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10048/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,929,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10049/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,929,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10050/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,929,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10051/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,929,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10052/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,929,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10053/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,930,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10054/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,930,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10055/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,930,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10056/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,930,752,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10057/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,930,944,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10058/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=1,931,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10059/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,931,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10060/500000]
+ optim/total_grad_norm=1.007
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,931,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10061/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=1,931,712,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10062/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,931,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10063/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,932,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10064/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,932,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10065/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,932,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10066/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,932,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10067/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,932,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10068/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,933,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10069/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,933,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10070/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,933,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10071/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,933,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10072/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,933,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10073/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,934,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10074/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,934,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10075/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,934,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10076/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,934,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10077/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,934,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10078/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,934,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10079/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,935,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10080/500000]
+ optim/total_grad_norm=1.148
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,935,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10081/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,935,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10082/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,935,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10083/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,935,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10084/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,936,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10085/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,936,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10086/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,936,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10087/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,936,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10088/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,936,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10089/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,937,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10090/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,937,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10091/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,937,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10092/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=1,937,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10093/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,937,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10094/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,938,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10095/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,938,240,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10096/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,938,432,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10097/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,938,624,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10098/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,938,816,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10099/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,939,008,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10100/500000]
+ optim/total_grad_norm=0.7384
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,939,200,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10101/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,939,392,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=10102/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,939,584,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=10103/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,939,776,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10104/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,939,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10105/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,940,160,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10106/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,940,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10107/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,940,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10108/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,940,736,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10109/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,940,928,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10110/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,941,120,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10111/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,941,312,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10112/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,941,504,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10113/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,941,696,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10114/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,941,888,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10115/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,942,080,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10116/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,942,272,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10117/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,942,464,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10118/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,942,656,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10119/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,942,848,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10120/500000]
+ optim/total_grad_norm=1.363
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,943,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10121/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,943,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10122/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,943,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10123/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,943,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10124/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,943,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10125/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,944,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10126/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,944,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10127/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,944,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10128/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,944,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10129/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,944,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10130/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,944,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10131/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,945,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10132/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,945,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10133/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,945,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10134/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,945,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10135/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,945,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10136/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,946,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10137/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,946,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10138/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,946,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10139/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,946,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10140/500000]
+ optim/total_grad_norm=1.035
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,946,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10141/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=1,947,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10142/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,947,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10143/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,947,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10144/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,947,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10145/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,947,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10146/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,948,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10147/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,948,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10148/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,948,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10149/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,948,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10150/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,948,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10151/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,948,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10152/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,949,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10153/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,949,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10154/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,949,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10155/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,949,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10156/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,949,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10157/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,950,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10158/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,950,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10159/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,950,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10160/500000]
+ optim/total_grad_norm=0.6704
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,950,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10161/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,950,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10162/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,951,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10163/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,951,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10164/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,951,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10165/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,951,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10166/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,951,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10167/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,952,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10168/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,952,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10169/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,952,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10170/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,952,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10171/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,952,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10172/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,953,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10173/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,953,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10174/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,953,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10175/500000]
+ train/ActionNoiseL2Loss=0.0103
+ throughput/total_tokens=1,953,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10176/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,953,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10177/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,953,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10178/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=1,954,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10179/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,954,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10180/500000]
+ optim/total_grad_norm=0.8936
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,954,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10181/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,954,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10182/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,954,944,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10183/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,955,136,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10184/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,955,328,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10185/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,955,520,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10186/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=1,955,712,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10187/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,955,904,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10188/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,956,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10189/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,956,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10190/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,956,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10191/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,956,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10192/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,956,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10193/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,957,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10194/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,957,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10195/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,957,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10196/500000]
+ train/ActionNoiseL2Loss=0.0082
+ throughput/total_tokens=1,957,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10197/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,957,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10198/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,958,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10199/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,958,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10200/500000]
+ optim/total_grad_norm=0.8790
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,958,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10201/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,958,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10202/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,958,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10203/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,958,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10204/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,959,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10205/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,959,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10206/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,959,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10207/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,959,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10208/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,959,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10209/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,960,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10210/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,960,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10211/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,960,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10212/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,960,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10213/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,960,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10214/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,961,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10215/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=1,961,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10216/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=1,961,472,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10217/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,961,664,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10218/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,961,856,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10219/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,962,048,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10220/500000]
+ optim/total_grad_norm=0.8824
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,962,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10221/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,962,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10222/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,962,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10223/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,962,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10224/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,963,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10225/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,963,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10226/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,963,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10227/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,963,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10228/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,963,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10229/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,963,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10230/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,964,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10231/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,964,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10232/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,964,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10233/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,964,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10234/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,964,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10235/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,965,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10236/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,965,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10237/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,965,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10238/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=1,965,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10239/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,965,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10240/500000]
+ optim/total_grad_norm=1.061
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,966,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10241/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,966,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10242/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,966,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10243/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,966,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10244/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,966,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10245/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,967,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10246/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,967,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10247/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,967,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10248/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,967,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10249/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,967,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10250/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,968,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10251/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,968,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10252/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,968,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10253/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,968,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10254/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,968,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10255/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,968,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10256/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,969,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10257/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,969,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10258/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,969,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10259/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,969,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10260/500000]
+ optim/total_grad_norm=0.8017
+ train/ActionNoiseL2Loss=0.0093
+ throughput/total_tokens=1,969,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10261/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,970,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10262/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,970,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10263/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,970,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10264/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,970,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10265/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,970,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10266/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,971,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10267/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,971,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10268/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,971,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10269/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,971,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10270/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,971,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10271/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,972,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10272/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,972,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10273/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,972,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10274/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,972,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10275/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,972,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10276/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,972,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10277/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,973,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10278/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,973,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10279/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,973,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10280/500000]
+ optim/total_grad_norm=1.170
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,973,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10281/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,973,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10282/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,974,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10283/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,974,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10284/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,974,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10285/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=1,974,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10286/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,974,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10287/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,975,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10288/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,975,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10289/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,975,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10290/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,975,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10291/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,975,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10292/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=1,976,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10293/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,976,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10294/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,976,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10295/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,976,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10296/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,976,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10297/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,977,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10298/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,977,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10299/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,977,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10300/500000]
+ optim/total_grad_norm=0.6610
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,977,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10301/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,977,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10302/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,977,984,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10303/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,978,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10304/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,978,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10305/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,978,560,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10306/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,978,752,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10307/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,978,944,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10308/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,979,136,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10309/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,979,328,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10310/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,979,520,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10311/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,979,712,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10312/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,979,904,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10313/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,980,096,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10314/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,980,288,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10315/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,980,480,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10316/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,980,672,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10317/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,980,864,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10318/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,981,056,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10319/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,981,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10320/500000]
+ optim/total_grad_norm=0.9461
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,981,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10321/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,981,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10322/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,981,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10323/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,982,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10324/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,982,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10325/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,982,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10326/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,982,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10327/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,982,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10328/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,982,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10329/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,983,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10330/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,983,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10331/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,983,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10332/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=1,983,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10333/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,983,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10334/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,984,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10335/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,984,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10336/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,984,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10337/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,984,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10338/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,984,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10339/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=1,985,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10340/500000]
+ optim/total_grad_norm=0.8386
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,985,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10341/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,985,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10342/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,985,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10343/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,985,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10344/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,986,048,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10345/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,986,240,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10346/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,986,432,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10347/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,986,624,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10348/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,986,816,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10349/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,987,008,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10350/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,987,200,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10351/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,987,392,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10352/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,987,584,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10353/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,987,776,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10354/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,987,968,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10355/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,988,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10356/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,988,352,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10357/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,988,544,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10358/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,988,736,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10359/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,988,928,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10360/500000]
+ optim/total_grad_norm=1.030
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,989,120,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10361/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,989,312,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10362/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,989,504,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10363/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,989,696,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10364/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,989,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10365/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,990,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10366/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,990,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10367/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,990,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10368/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,990,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10369/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,990,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10370/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,991,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10371/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,991,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10372/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,991,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10373/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,991,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10374/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,991,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10375/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,992,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10376/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,992,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10377/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,992,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10378/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,992,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10379/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,992,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10380/500000]
+ optim/total_grad_norm=1.704
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,992,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10381/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,993,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10382/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,993,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10383/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,993,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10384/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,993,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10385/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,993,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10386/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,994,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10387/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,994,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10388/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,994,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10389/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,994,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10390/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,994,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10391/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,995,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10392/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,995,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10393/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,995,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10394/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,995,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10395/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,995,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10396/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,996,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10397/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,996,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10398/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,996,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10399/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,996,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10400/500000]
+ optim/total_grad_norm=0.7499
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,996,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10401/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,996,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10402/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,997,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10403/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,997,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10404/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,997,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10405/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,997,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10406/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,997,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10407/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,998,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10408/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,998,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10409/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,998,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10410/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,998,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10411/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,998,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10412/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,999,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10413/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,999,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10414/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,999,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10415/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,999,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10416/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,999,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10417/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,000,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10418/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,000,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10419/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,000,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10420/500000]
+ optim/total_grad_norm=0.9345
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,000,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10421/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,000,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10422/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,001,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10423/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,001,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10424/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,001,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10425/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,001,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10426/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,001,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10427/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,001,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10428/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,002,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10429/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,002,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10430/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,002,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10431/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,002,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10432/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,002,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10433/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,003,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10434/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,003,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10435/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,003,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10436/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,003,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10437/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,003,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10438/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,004,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10439/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=2,004,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10440/500000]
+ optim/total_grad_norm=0.8630
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,004,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10441/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,004,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10442/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,004,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10443/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,005,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10444/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,005,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10445/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,005,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10446/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,005,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10447/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,005,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10448/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,006,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10449/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,006,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10450/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,006,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10451/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=2,006,592,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10452/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,006,784,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10453/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,006,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10454/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=2,007,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10455/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=2,007,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10456/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,007,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10457/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,007,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10458/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,007,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10459/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,008,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10460/500000]
+ optim/total_grad_norm=1.646
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=2,008,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10461/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=2,008,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10462/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,008,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10463/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,008,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10464/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,009,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10465/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,009,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10466/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,009,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10467/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,009,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10468/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,009,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10469/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,010,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10470/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,010,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10471/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=2,010,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10472/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=2,010,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10473/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,010,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10474/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,011,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10475/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,011,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10476/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=2,011,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10477/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,011,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10478/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,011,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10479/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,011,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10480/500000]
+ optim/total_grad_norm=1.166
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,012,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10481/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,012,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10482/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,012,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10483/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,012,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10484/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,012,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10485/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,013,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10486/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,013,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10487/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,013,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10488/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,013,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10489/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,013,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10490/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,014,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10491/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,014,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10492/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,014,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10493/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,014,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10494/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,014,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10495/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,015,040,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10496/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,015,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10497/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,015,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10498/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,015,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10499/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,015,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10500/500000]
+ optim/total_grad_norm=1.060
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,016,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/26 [23:28:37] INFO | >> Saving config... checkpoint.py:608
+09/26 [23:29:07] INFO | >> Saving model state... checkpoint.py:796
+09/26 [23:30:08] INFO | >> Saving optim state... checkpoint.py:811
+09/26 [23:30:13] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10501/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,016,192,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=10502/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,016,384,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10503/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,016,576,000
+ throughput/device/tokens_per_second=1,100
+ throughput/device/batches_per_second=0.0459
+[step=10504/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,016,768,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=10505/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,016,960,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=10506/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,017,152,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=10507/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,017,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=10508/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,017,536,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=10509/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,017,728,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=10510/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=2,017,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,437
+[step=10511/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,018,112,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=10512/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,018,304,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=10513/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,018,496,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=10514/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,018,688,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=10515/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,018,880,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=10516/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=2,019,072,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=10517/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,019,264,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=10518/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,019,456,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=10519/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,019,648,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10520/500000]
+ optim/total_grad_norm=0.8782
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,019,840,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=10521/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,020,032,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=10522/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,020,224,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10523/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,020,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10524/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,020,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10525/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,020,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10526/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,020,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10527/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,021,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10528/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,021,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10529/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,021,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10530/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,021,760,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10531/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,021,952,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10532/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=2,022,144,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10533/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,022,336,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10534/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,022,528,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10535/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,022,720,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10536/500000]
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=2,022,912,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10537/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,023,104,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10538/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,023,296,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10539/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,023,488,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10540/500000]
+ optim/total_grad_norm=1.298
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,023,680,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10541/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,023,872,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10542/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,024,064,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10543/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,024,256,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10544/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,024,448,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10545/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,024,640,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10546/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,024,832,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10547/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,025,024,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10548/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,025,216,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10549/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,025,408,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10550/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,025,600,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10551/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,025,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10552/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,025,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10553/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,026,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10554/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,026,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10555/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,026,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10556/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=2,026,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10557/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,026,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10558/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=2,027,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10559/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,027,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10560/500000]
+ optim/total_grad_norm=1.050
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,027,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10561/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,027,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10562/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,027,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10563/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,028,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10564/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,028,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10565/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,028,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10566/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,028,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10567/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,028,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10568/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,029,056,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10569/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,029,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10570/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,029,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10571/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,029,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10572/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,029,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10573/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,030,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10574/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,030,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10575/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,030,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10576/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,030,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10577/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=2,030,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10578/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,030,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10579/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,031,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10580/500000]
+ optim/total_grad_norm=0.9914
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,031,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10581/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=2,031,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10582/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,031,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10583/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,031,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10584/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,032,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10585/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,032,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10586/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,032,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10587/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,032,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10588/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,032,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10589/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,033,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10590/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,033,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10591/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,033,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10592/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,033,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10593/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=2,033,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10594/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,034,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10595/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,034,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10596/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,034,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10597/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,034,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10598/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,034,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10599/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,035,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10600/500000]
+ optim/total_grad_norm=0.9922
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,035,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10601/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=2,035,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10602/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,035,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10603/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,035,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10604/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,035,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10605/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,036,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10606/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=2,036,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10607/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,036,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10608/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,036,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10609/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,036,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10610/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,037,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10611/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,037,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10612/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,037,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10613/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,037,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10614/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,037,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10615/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=2,038,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10616/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,038,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10617/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,038,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10618/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,038,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10619/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,038,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10620/500000]
+ optim/total_grad_norm=0.9684
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,039,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10621/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,039,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10622/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,039,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10623/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,039,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10624/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,039,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10625/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,040,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10626/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,040,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10627/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,040,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10628/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,040,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10629/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,040,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10630/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,040,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10631/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,041,152,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10632/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=2,041,344,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10633/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,041,536,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10634/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,041,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10635/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,041,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10636/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,042,112,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10637/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,042,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10638/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,042,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10639/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,042,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10640/500000]
+ optim/total_grad_norm=0.9891
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,042,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10641/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,043,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10642/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,043,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10643/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,043,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10644/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,043,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10645/500000]
+ train/ActionNoiseL2Loss=0.0084
+ throughput/total_tokens=2,043,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10646/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,044,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10647/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,044,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10648/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,044,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10649/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,044,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10650/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,044,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10651/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,044,992,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10652/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,045,184,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10653/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=2,045,376,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10654/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,045,568,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10655/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,045,760,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10656/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,045,952,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10657/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,046,144,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10658/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,046,336,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10659/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,046,528,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10660/500000]
+ optim/total_grad_norm=1.136
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,046,720,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10661/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,046,912,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10662/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,047,104,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10663/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,047,296,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10664/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,047,488,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10665/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,047,680,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10666/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,047,872,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10667/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,048,064,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10668/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,048,256,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10669/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,048,448,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=10670/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=2,048,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10671/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,048,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10672/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,049,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10673/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,049,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10674/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,049,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10675/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,049,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10676/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,049,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10677/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,049,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=10678/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,050,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10679/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,050,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10680/500000]
+ optim/total_grad_norm=1.868
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=2,050,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10681/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,050,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10682/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,050,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10683/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,051,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10684/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,051,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10685/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,051,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10686/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=2,051,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10687/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,051,904,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10688/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,052,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10689/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,052,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10690/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,052,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10691/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,052,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10692/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,052,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10693/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,053,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10694/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,053,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10695/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,053,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10696/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,053,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10697/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,053,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10698/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,054,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10699/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,054,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10700/500000]
+ optim/total_grad_norm=0.8125
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,054,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10701/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,054,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10702/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,054,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10703/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,054,976,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10704/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,055,168,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10705/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,055,360,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10706/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,055,552,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10707/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,055,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10708/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,055,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10709/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,056,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10710/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,056,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10711/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,056,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10712/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,056,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10713/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,056,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10714/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,057,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10715/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,057,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10716/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,057,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10717/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,057,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10718/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,057,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10719/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,058,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10720/500000]
+ optim/total_grad_norm=0.7196
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,058,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10721/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,058,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10722/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=2,058,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10723/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=2,058,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10724/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,059,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10725/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,059,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10726/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,059,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10727/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,059,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10728/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,059,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10729/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,059,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10730/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,060,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10731/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,060,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10732/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,060,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10733/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,060,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10734/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,060,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10735/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,061,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10736/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,061,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10737/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,061,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10738/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,061,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10739/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,061,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10740/500000]
+ optim/total_grad_norm=0.9907
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,062,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10741/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,062,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10742/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,062,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10743/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,062,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10744/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,062,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10745/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,063,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10746/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,063,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10747/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,063,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10748/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,063,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10749/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,063,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10750/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,064,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10751/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,064,192,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10752/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,064,384,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10753/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,064,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10754/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,064,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10755/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,064,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10756/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,065,152,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10757/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,065,344,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10758/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,065,536,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10759/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,065,728,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10760/500000]
+ optim/total_grad_norm=1.518
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,065,920,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10761/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,066,112,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=10762/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,066,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10763/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,066,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10764/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,066,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10765/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,066,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10766/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,067,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10767/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,067,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10768/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,067,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10769/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,067,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10770/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,067,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10771/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,068,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10772/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,068,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10773/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,068,416,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10774/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,068,608,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10775/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,068,800,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10776/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,068,992,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10777/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=2,069,184,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10778/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,069,376,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10779/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,069,568,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10780/500000]
+ optim/total_grad_norm=0.8177
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,069,760,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10781/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,069,952,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10782/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,070,144,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10783/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,070,336,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10784/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,070,528,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10785/500000]
+ train/ActionNoiseL2Loss=0.0088
+ throughput/total_tokens=2,070,720,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10786/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,070,912,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10787/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,071,104,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10788/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=2,071,296,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10789/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,071,488,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10790/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,071,680,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10791/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,071,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10792/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,072,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10793/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,072,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10794/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,072,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10795/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,072,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10796/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,072,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10797/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,073,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10798/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,073,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10799/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,073,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10800/500000]
+ optim/total_grad_norm=0.9075
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,073,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10801/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,073,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10802/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,073,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10803/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,074,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10804/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,074,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10805/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,074,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10806/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,074,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10807/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,074,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10808/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,075,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10809/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,075,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10810/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,075,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10811/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,075,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10812/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,075,904,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10813/500000]
+ train/ActionNoiseL2Loss=0.0089
+ throughput/total_tokens=2,076,096,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10814/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,076,288,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10815/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,076,480,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10816/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,076,672,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10817/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,076,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10818/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,077,056,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10819/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,077,248,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10820/500000]
+ optim/total_grad_norm=1.025
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,077,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10821/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,077,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10822/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,077,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10823/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,078,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10824/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,078,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10825/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=2,078,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10826/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,078,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10827/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,078,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10828/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,078,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10829/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,079,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10830/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,079,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10831/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,079,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10832/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=2,079,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10833/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,079,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10834/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=2,080,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10835/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,080,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10836/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,080,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10837/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,080,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10838/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,080,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10839/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,081,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10840/500000]
+ optim/total_grad_norm=0.9781
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,081,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10841/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,081,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10842/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,081,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10843/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,081,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10844/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,082,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10845/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,082,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10846/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,082,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10847/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,082,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10848/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,082,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10849/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,083,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10850/500000]
+ train/ActionNoiseL2Loss=0.0099
+ throughput/total_tokens=2,083,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10851/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,083,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10852/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,083,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10853/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,083,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10854/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,083,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10855/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,084,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10856/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,084,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10857/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,084,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10858/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,084,736,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10859/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,084,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10860/500000]
+ optim/total_grad_norm=1.413
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,085,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10861/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,085,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10862/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,085,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10863/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,085,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10864/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,085,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10865/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,086,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10866/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,086,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10867/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,086,464,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10868/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,086,656,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10869/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,086,848,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10870/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,087,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10871/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,087,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10872/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,087,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10873/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,087,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10874/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,087,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10875/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,088,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10876/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,088,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10877/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,088,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10878/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,088,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10879/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,088,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10880/500000]
+ optim/total_grad_norm=0.8154
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,088,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10881/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,089,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10882/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,089,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10883/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,089,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10884/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,089,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10885/500000]
+ train/ActionNoiseL2Loss=0.0079
+ throughput/total_tokens=2,089,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10886/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,090,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10887/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,090,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10888/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,090,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10889/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,090,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10890/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,090,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10891/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,091,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10892/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,091,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10893/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,091,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10894/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,091,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10895/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,091,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10896/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,092,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10897/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,092,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10898/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,092,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10899/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,092,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10900/500000]
+ optim/total_grad_norm=1.342
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=2,092,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10901/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,092,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=10902/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,093,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10903/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,093,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10904/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=2,093,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10905/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,093,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10906/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,093,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10907/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,094,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10908/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,094,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10909/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,094,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10910/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,094,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10911/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,094,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10912/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=2,095,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10913/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,095,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10914/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,095,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10915/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,095,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10916/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,095,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10917/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,096,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10918/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,096,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10919/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,096,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10920/500000]
+ optim/total_grad_norm=1.302
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,096,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10921/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,096,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10922/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,097,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10923/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,097,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10924/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,097,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10925/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,097,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10926/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,097,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10927/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,097,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10928/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,098,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10929/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,098,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10930/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,098,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10931/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=2,098,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10932/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,098,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10933/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,099,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10934/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,099,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10935/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,099,520,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10936/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,099,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10937/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,099,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10938/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,100,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10939/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,100,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10940/500000]
+ optim/total_grad_norm=1.137
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,100,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=10941/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,100,672,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10942/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,100,864,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=10943/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,101,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10944/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,101,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10945/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,101,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10946/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,101,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10947/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,101,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10948/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,102,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10949/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,102,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10950/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,102,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10951/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,102,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10952/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,102,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10953/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,102,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10954/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,103,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10955/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,103,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10956/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,103,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10957/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,103,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10958/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,103,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10959/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,104,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10960/500000]
+ optim/total_grad_norm=1.515
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,104,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=10961/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,104,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10962/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,104,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10963/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,104,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10964/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,105,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10965/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,105,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10966/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,105,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10967/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,105,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10968/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,105,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10969/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,106,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=10970/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,106,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10971/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,106,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10972/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,106,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10973/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,106,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10974/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,107,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10975/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,107,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10976/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,107,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10977/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,107,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10978/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,107,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10979/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,107,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10980/500000]
+ optim/total_grad_norm=1.025
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,108,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10981/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,108,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10982/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=2,108,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10983/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=2,108,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=10984/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,108,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10985/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,109,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10986/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,109,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10987/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,109,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10988/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=2,109,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10989/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,109,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10990/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,110,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=10991/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,110,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10992/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,110,464,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10993/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,110,656,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10994/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,110,848,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10995/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,111,040,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10996/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,111,232,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10997/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,111,424,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10998/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,111,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=10999/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,111,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11000/500000]
+ optim/total_grad_norm=1.051
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=2,112,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+09/27 [02:28:39] INFO | >> Saving config... checkpoint.py:608
+09/27 [02:29:12] INFO | >> Saving model state... checkpoint.py:796
+09/27 [02:30:11] INFO | >> Saving optim state... checkpoint.py:811
+09/27 [02:30:16] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11001/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=2,112,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11002/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,112,384,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11003/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,112,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11004/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,112,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11005/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,112,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11006/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,113,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11007/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=2,113,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11008/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,113,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11009/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,113,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11010/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,113,920,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11011/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,114,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11012/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,114,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11013/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,114,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11014/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,114,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11015/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,114,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11016/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,115,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11017/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,115,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11018/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,115,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11019/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,115,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11020/500000]
+ optim/total_grad_norm=0.9366
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,115,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11021/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,116,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11022/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=2,116,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11023/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,116,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11024/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,116,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11025/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,116,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11026/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,116,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11027/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,117,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11028/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,117,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11029/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,117,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11030/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,117,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11031/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,117,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11032/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,118,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11033/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,118,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11034/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,118,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11035/500000]
+ train/ActionNoiseL2Loss=0.0073
+ throughput/total_tokens=2,118,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11036/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=2,118,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11037/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,119,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11038/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,119,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11039/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,119,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11040/500000]
+ optim/total_grad_norm=0.8477
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,119,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11041/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=2,119,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11042/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,120,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11043/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,120,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11044/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,120,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11045/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,120,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11046/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,120,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11047/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,121,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11048/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,121,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11049/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,121,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11050/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,121,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11051/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,121,792,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11052/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,121,984,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11053/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,122,176,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11054/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,122,368,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11055/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=2,122,560,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11056/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,122,752,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11057/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,122,944,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11058/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,123,136,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11059/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,123,328,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11060/500000]
+ optim/total_grad_norm=0.8087
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,123,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11061/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,123,712,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11062/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,123,904,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11063/500000]
+ train/ActionNoiseL2Loss=0.0099
+ throughput/total_tokens=2,124,096,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11064/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,124,288,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11065/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,124,480,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11066/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,124,672,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11067/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,124,864,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11068/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,125,056,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11069/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=2,125,248,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11070/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=2,125,440,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11071/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,125,632,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11072/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,125,824,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11073/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,126,016,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11074/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,126,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11075/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,126,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11076/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,126,592,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11077/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,126,784,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11078/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=2,126,976,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11079/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,127,168,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11080/500000]
+ optim/total_grad_norm=1.549
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,127,360,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11081/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,127,552,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11082/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,127,744,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11083/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,127,936,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11084/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,128,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11085/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,128,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11086/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=2,128,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11087/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,128,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11088/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,128,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11089/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,129,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11090/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,129,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11091/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,129,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11092/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,129,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11093/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,129,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11094/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,130,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11095/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,130,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11096/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,130,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11097/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,130,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11098/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=2,130,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11099/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,131,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11100/500000]
+ optim/total_grad_norm=1.055
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,131,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11101/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=2,131,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11102/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=2,131,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11103/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,131,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11104/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,131,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11105/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,132,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11106/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,132,352,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11107/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,132,544,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11108/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,132,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11109/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,132,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11110/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,133,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11111/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,133,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11112/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,133,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11113/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,133,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11114/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,133,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11115/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,134,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11116/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=2,134,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11117/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,134,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11118/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,134,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11119/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,134,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11120/500000]
+ optim/total_grad_norm=0.9736
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,135,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11121/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,135,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11122/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,135,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11123/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,135,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11124/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,135,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11125/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,136,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11126/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,136,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11127/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,136,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11128/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,136,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11129/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,136,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11130/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,136,960,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11131/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,137,152,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11132/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,137,344,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11133/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,137,536,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11134/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,137,728,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11135/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,137,920,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11136/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,138,112,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11137/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,138,304,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11138/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,138,496,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11139/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,138,688,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11140/500000]
+ optim/total_grad_norm=1.028
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,138,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11141/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,139,072,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11142/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,139,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11143/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,139,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11144/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,139,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11145/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,139,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11146/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,140,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11147/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,140,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11148/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,140,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11149/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,140,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11150/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,140,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11151/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,140,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11152/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,141,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11153/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,141,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11154/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,141,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11155/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,141,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11156/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=2,141,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11157/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,142,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11158/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,142,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11159/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,142,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11160/500000]
+ optim/total_grad_norm=0.9037
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,142,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11161/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,142,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11162/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,143,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11163/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,143,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11164/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,143,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11165/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,143,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11166/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,143,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11167/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,144,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11168/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,144,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11169/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,144,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11170/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,144,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11171/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,144,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11172/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,145,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11173/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,145,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11174/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,145,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11175/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,145,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11176/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=2,145,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11177/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,145,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11178/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,146,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11179/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,146,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11180/500000]
+ optim/total_grad_norm=0.8660
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,146,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11181/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,146,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11182/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,146,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11183/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,147,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11184/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,147,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11185/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,147,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11186/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,147,712,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11187/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,147,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11188/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,148,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11189/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,148,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11190/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,148,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11191/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,148,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11192/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,148,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11193/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,149,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11194/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=2,149,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11195/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,149,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11196/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,149,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11197/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,149,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11198/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,150,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11199/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,150,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11200/500000]
+ optim/total_grad_norm=0.8271
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,150,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11201/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,150,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11202/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,150,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11203/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,150,976,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11204/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=2,151,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11205/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,151,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11206/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,151,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11207/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,151,744,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11208/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,151,936,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11209/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,152,128,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11210/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,152,320,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11211/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,152,512,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11212/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,152,704,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11213/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,152,896,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11214/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,153,088,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11215/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,153,280,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11216/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,153,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11217/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,153,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11218/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,153,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11219/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,154,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11220/500000]
+ optim/total_grad_norm=0.9621
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,154,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11221/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,154,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11222/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,154,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11223/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,154,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11224/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=2,155,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11225/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,155,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11226/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,155,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11227/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,155,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11228/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,155,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11229/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,155,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11230/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,156,160,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11231/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,156,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11232/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,156,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11233/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,156,736,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11234/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,156,928,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11235/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,157,120,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11236/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,157,312,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11237/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,157,504,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11238/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,157,696,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11239/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,157,888,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11240/500000]
+ optim/total_grad_norm=1.087
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,158,080,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11241/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,158,272,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11242/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,158,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11243/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,158,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11244/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,158,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11245/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,159,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11246/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,159,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11247/500000]
+ train/ActionNoiseL2Loss=0.0101
+ throughput/total_tokens=2,159,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11248/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,159,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11249/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,159,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11250/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,160,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11251/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,160,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11252/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,160,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11253/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,160,576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11254/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,160,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11255/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,160,960,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11256/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,161,152,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11257/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=2,161,344,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11258/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,161,536,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11259/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,161,728,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11260/500000]
+ optim/total_grad_norm=0.8295
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,161,920,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11261/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,162,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11262/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,162,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11263/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,162,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11264/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,162,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11265/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,162,880,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11266/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,163,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11267/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,163,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11268/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,163,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11269/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=2,163,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11270/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,163,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11271/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,164,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11272/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,164,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11273/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,164,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11274/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,164,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11275/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,164,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11276/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,164,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11277/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,165,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11278/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,165,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11279/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,165,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11280/500000]
+ optim/total_grad_norm=1.021
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,165,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11281/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,165,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11282/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,166,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11283/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,166,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11284/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,166,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11285/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,166,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11286/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,166,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11287/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,167,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11288/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,167,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11289/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,167,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11290/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,167,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11291/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=2,167,872,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11292/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,168,064,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11293/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=2,168,256,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11294/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,168,448,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11295/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,168,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11296/500000]
+ train/ActionNoiseL2Loss=0.0093
+ throughput/total_tokens=2,168,832,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11297/500000]
+ train/ActionNoiseL2Loss=0.0095
+ throughput/total_tokens=2,169,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11298/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,169,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11299/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,169,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11300/500000]
+ optim/total_grad_norm=1.126
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,169,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11301/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,169,792,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11302/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,169,984,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11303/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,170,176,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11304/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,170,368,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11305/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,170,560,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11306/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,170,752,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11307/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,170,944,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11308/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,171,136,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11309/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,171,328,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11310/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,171,520,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11311/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,171,712,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11312/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,171,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11313/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,172,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11314/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,172,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11315/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,172,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11316/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,172,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11317/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,172,864,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11318/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,173,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11319/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,173,248,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11320/500000]
+ optim/total_grad_norm=1.034
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,173,440,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11321/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,173,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11322/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,173,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11323/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,174,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11324/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,174,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11325/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,174,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11326/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,174,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11327/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,174,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11328/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=2,174,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11329/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,175,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11330/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,175,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11331/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,175,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11332/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,175,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11333/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,175,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11334/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,176,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11335/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,176,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11336/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,176,512,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11337/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,176,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11338/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,176,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11339/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,177,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11340/500000]
+ optim/total_grad_norm=1.044
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,177,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11341/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,177,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11342/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,177,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11343/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=2,177,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11344/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=2,178,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11345/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=2,178,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11346/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,178,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11347/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,178,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11348/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,178,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11349/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,179,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11350/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,179,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11351/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,179,392,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11352/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=2,179,584,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11353/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,179,776,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11354/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,179,968,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11355/500000]
+ train/ActionNoiseL2Loss=0.0112
+ throughput/total_tokens=2,180,160,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11356/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,180,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11357/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,180,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11358/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,180,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11359/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,180,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11360/500000]
+ optim/total_grad_norm=1.093
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,181,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11361/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,181,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11362/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,181,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11363/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,181,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11364/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,181,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11365/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,182,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11366/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,182,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11367/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,182,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11368/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,182,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11369/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,182,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11370/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=2,183,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11371/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,183,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11372/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,183,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11373/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,183,616,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11374/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,183,808,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11375/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,184,000,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11376/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,184,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11377/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,184,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11378/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,184,576,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11379/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,184,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11380/500000]
+ optim/total_grad_norm=1.053
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,184,960,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11381/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,185,152,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11382/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,185,344,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11383/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,185,536,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11384/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,185,728,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11385/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,185,920,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11386/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,186,112,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11387/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,186,304,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=11388/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=2,186,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11389/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,186,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11390/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,186,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11391/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,187,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11392/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,187,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11393/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,187,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11394/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,187,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11395/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,187,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11396/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,188,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11397/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,188,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11398/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,188,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11399/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,188,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11400/500000]
+ optim/total_grad_norm=0.9548
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,188,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11401/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,188,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11402/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,189,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11403/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,189,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11404/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,189,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11405/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,189,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11406/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,189,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11407/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,190,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11408/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,190,336,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11409/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,190,528,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11410/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,190,720,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11411/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,190,912,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11412/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,191,104,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11413/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,191,296,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11414/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=2,191,488,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11415/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,191,680,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11416/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,191,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11417/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,192,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11418/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,192,256,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11419/500000]
+ train/ActionNoiseL2Loss=0.0097
+ throughput/total_tokens=2,192,448,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11420/500000]
+ optim/total_grad_norm=1.195
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,192,640,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11421/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,192,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11422/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,193,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11423/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,193,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11424/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,193,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11425/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,193,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11426/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,193,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11427/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,193,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11428/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,194,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11429/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,194,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11430/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,194,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11431/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,194,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11432/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,194,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11433/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,195,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11434/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=2,195,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11435/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,195,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11436/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,195,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11437/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,195,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11438/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,196,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11439/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,196,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11440/500000]
+ optim/total_grad_norm=1.036
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,196,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11441/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,196,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11442/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,196,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11443/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,197,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11444/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,197,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11445/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,197,440,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11446/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,197,632,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11447/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,197,824,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11448/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,198,016,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11449/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,198,208,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11450/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,198,400,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11451/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,198,592,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11452/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,198,784,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11453/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,198,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11454/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,199,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11455/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,199,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11456/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,199,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11457/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,199,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11458/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,199,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11459/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,200,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11460/500000]
+ optim/total_grad_norm=0.8453
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,200,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11461/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=2,200,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11462/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,200,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11463/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,200,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11464/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,201,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11465/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,201,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11466/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,201,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11467/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,201,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11468/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,201,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11469/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,202,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11470/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,202,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11471/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,202,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11472/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,202,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11473/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,202,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11474/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,203,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11475/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,203,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11476/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,203,392,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11477/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,203,584,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11478/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,203,776,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11479/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,203,968,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11480/500000]
+ optim/total_grad_norm=0.8924
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,204,160,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11481/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,204,352,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11482/500000]
+ train/ActionNoiseL2Loss=0.0096
+ throughput/total_tokens=2,204,544,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11483/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,204,736,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11484/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,204,928,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11485/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,205,120,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11486/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=2,205,312,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11487/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,205,504,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11488/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,205,696,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11489/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,205,888,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11490/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,206,080,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11491/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,206,272,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11492/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,206,464,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11493/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,206,656,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11494/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,206,848,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11495/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,207,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11496/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,207,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11497/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,207,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11498/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,207,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11499/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,207,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11500/500000]
+ optim/total_grad_norm=1.054
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,208,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+09/27 [05:28:44] INFO | >> Saving config... checkpoint.py:608
+09/27 [05:29:15] INFO | >> Saving model state... checkpoint.py:796
+09/27 [05:30:15] INFO | >> Saving optim state... checkpoint.py:811
+09/27 [05:30:20] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11501/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,208,192,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=11502/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,208,384,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=11503/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,208,576,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=11504/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,208,768,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=11505/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,208,960,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=11506/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,209,152,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=11507/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,209,344,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=11508/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,209,536,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=11509/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,209,728,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11510/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,209,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11511/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,210,112,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11512/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,210,304,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11513/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,210,496,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11514/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,210,688,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11515/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,210,880,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11516/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,211,072,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11517/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,211,264,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11518/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,211,456,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11519/500000]
+ train/ActionNoiseL2Loss=0.0112
+ throughput/total_tokens=2,211,648,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11520/500000]
+ optim/total_grad_norm=0.7256
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,211,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11521/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,212,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11522/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=2,212,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11523/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,212,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11524/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,212,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11525/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,212,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11526/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,212,992,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11527/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,213,184,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11528/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,213,376,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11529/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,213,568,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11530/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,213,760,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11531/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,213,952,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11532/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=2,214,144,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11533/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,214,336,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11534/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,214,528,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11535/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,214,720,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11536/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,214,912,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11537/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,215,104,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11538/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,215,296,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11539/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,215,488,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11540/500000]
+ optim/total_grad_norm=1.162
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,215,680,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11541/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,215,872,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11542/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,216,064,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11543/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,216,256,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11544/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,216,448,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11545/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,216,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11546/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,216,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11547/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,217,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11548/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,217,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11549/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,217,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11550/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,217,600,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11551/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=2,217,792,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11552/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,217,984,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11553/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,218,176,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11554/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,218,368,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11555/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,218,560,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11556/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,218,752,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11557/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,218,944,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11558/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,219,136,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11559/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,219,328,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=11560/500000]
+ optim/total_grad_norm=0.8859
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,219,520,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+ System/Peak GPU Memory (MB)=44,437
+[step=11561/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,219,712,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11562/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,219,904,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11563/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,220,096,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11564/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=2,220,288,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11565/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,220,480,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11566/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,220,672,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11567/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,220,864,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11568/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,221,056,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=11569/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,221,248,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=11570/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,221,440,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11571/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,221,632,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11572/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=2,221,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11573/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,222,016,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11574/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=2,222,208,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11575/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,222,400,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11576/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,222,592,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11577/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,222,784,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11578/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,222,976,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11579/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,223,168,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11580/500000]
+ optim/total_grad_norm=0.9936
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=2,223,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11581/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,223,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11582/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,223,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11583/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,223,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11584/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,224,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11585/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,224,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11586/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,224,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11587/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,224,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11588/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,224,896,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11589/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,225,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11590/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=2,225,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11591/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,225,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11592/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,225,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11593/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,225,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11594/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,226,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11595/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,226,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11596/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,226,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11597/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,226,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11598/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=2,226,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11599/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,227,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11600/500000]
+ optim/total_grad_norm=0.9215
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,227,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11601/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,227,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11602/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,227,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11603/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,227,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11604/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,227,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11605/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,228,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11606/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,228,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11607/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,228,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11608/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=2,228,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11609/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,228,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11610/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,229,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11611/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,229,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11612/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,229,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11613/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,229,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11614/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,229,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11615/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,230,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11616/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,230,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11617/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,230,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11618/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=2,230,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11619/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,230,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11620/500000]
+ optim/total_grad_norm=0.8075
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,231,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11621/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,231,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11622/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,231,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11623/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,231,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11624/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,231,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11625/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,232,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11626/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,232,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11627/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=2,232,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11628/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=2,232,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11629/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,232,768,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11630/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,232,960,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11631/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,233,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11632/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=2,233,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11633/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,233,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11634/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,233,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11635/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,233,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11636/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,234,112,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11637/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,234,304,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11638/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,234,496,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11639/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,234,688,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11640/500000]
+ optim/total_grad_norm=1.075
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,234,880,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11641/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,235,072,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11642/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,235,264,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11643/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,235,456,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11644/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,235,648,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11645/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,235,840,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11646/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,236,032,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11647/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=2,236,224,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11648/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=2,236,416,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11649/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=2,236,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11650/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,236,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11651/500000]
+ train/ActionNoiseL2Loss=0.0096
+ throughput/total_tokens=2,236,992,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11652/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,237,184,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11653/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,237,376,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11654/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,237,568,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11655/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,237,760,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11656/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,237,952,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11657/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=2,238,144,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11658/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,238,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11659/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,238,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11660/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,238,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11661/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,238,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11662/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,239,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11663/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,239,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11664/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,239,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11665/500000]
+ train/ActionNoiseL2Loss=0.0114
+ throughput/total_tokens=2,239,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11666/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,239,872,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11667/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,240,064,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11668/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,240,256,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11669/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,240,448,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11670/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,240,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11671/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,240,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11672/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,241,024,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11673/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,241,216,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11674/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,241,408,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11675/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,241,600,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11676/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,241,792,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11677/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,241,984,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11678/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,242,176,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11679/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,242,368,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11680/500000]
+ optim/total_grad_norm=0.4560
+ train/ActionNoiseL2Loss=0.0085
+ throughput/total_tokens=2,242,560,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11681/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,242,752,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11682/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,242,944,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11683/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,243,136,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11684/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,243,328,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11685/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,243,520,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11686/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,243,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11687/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,243,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11688/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,244,096,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11689/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,244,288,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11690/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,244,480,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11691/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,244,672,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11692/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,244,864,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11693/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,245,056,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11694/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,245,248,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11695/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,245,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11696/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,245,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11697/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,245,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11698/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,246,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11699/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,246,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11700/500000]
+ optim/total_grad_norm=1.553
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,246,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11701/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,246,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11702/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,246,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11703/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,246,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11704/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,247,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11705/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,247,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11706/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,247,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11707/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,247,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11708/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,247,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11709/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,248,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11710/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=2,248,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11711/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,248,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11712/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=2,248,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11713/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,248,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11714/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,249,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11715/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,249,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11716/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,249,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11717/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,249,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11718/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,249,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11719/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,250,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11720/500000]
+ optim/total_grad_norm=0.7273
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,250,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11721/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,250,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11722/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,250,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11723/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,250,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11724/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,251,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11725/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,251,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11726/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,251,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11727/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,251,584,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11728/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,251,776,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11729/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,251,968,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11730/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,252,160,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11731/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,252,352,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11732/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,252,544,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11733/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,252,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11734/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,252,928,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11735/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,253,120,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11736/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,253,312,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11737/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,253,504,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11738/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,253,696,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11739/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,253,888,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11740/500000]
+ optim/total_grad_norm=0.8704
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,254,080,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11741/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,254,272,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11742/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,254,464,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11743/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,254,656,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11744/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,254,848,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11745/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,255,040,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11746/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,255,232,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11747/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,255,424,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11748/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,255,616,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11749/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,255,808,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11750/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,256,000,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11751/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,256,192,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11752/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,256,384,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11753/500000]
+ train/ActionNoiseL2Loss=0.0089
+ throughput/total_tokens=2,256,576,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11754/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,256,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11755/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,256,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11756/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,257,152,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11757/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=2,257,344,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11758/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,257,536,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11759/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,257,728,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11760/500000]
+ optim/total_grad_norm=0.8588
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,257,920,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11761/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,258,112,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11762/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,258,304,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11763/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,258,496,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11764/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,258,688,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11765/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,258,880,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11766/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,259,072,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11767/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,259,264,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11768/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,259,456,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11769/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=2,259,648,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11770/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,259,840,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11771/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,260,032,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11772/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,260,224,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11773/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,260,416,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11774/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,260,608,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11775/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=2,260,800,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11776/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,260,992,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11777/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=2,261,184,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11778/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,261,376,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11779/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,261,568,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11780/500000]
+ optim/total_grad_norm=0.8243
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,261,760,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11781/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,261,952,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11782/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,262,144,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11783/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,262,336,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11784/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,262,528,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11785/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=2,262,720,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11786/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,262,912,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11787/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,263,104,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11788/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,263,296,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11789/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,263,488,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11790/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=2,263,680,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11791/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,263,872,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11792/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,264,064,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11793/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,264,256,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11794/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,264,448,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11795/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,264,640,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11796/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,264,832,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11797/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,265,024,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11798/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,265,216,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11799/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,265,408,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11800/500000]
+ optim/total_grad_norm=1.434
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,265,600,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11801/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,265,792,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=11802/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,265,984,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=11803/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,266,176,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=11804/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,266,368,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11805/500000]
+ train/ActionNoiseL2Loss=0.0080
+ throughput/total_tokens=2,266,560,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11806/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,266,752,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11807/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,266,944,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11808/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,267,136,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11809/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,267,328,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11810/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,267,520,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,437
+[step=11811/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,267,712,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11812/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,267,904,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11813/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=2,268,096,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11814/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,268,288,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=11815/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,268,480,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=11816/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=2,268,672,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=11817/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,268,864,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=11818/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,269,056,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=11819/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,269,248,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=11820/500000]
+ optim/total_grad_norm=0.9260
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,269,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11821/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,269,632,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11822/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=2,269,824,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11823/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,270,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11824/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,270,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=11825/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=2,270,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11826/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=2,270,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11827/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=2,270,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11828/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=2,270,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11829/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,271,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11830/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,271,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11831/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,271,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11832/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=2,271,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11833/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,271,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11834/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,272,128,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11835/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,272,320,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11836/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,272,512,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11837/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=2,272,704,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11838/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,272,896,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11839/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,273,088,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11840/500000]
+ optim/total_grad_norm=1.309
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,273,280,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11841/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,273,472,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11842/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,273,664,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11843/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,273,856,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11844/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,274,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11845/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,274,240,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11846/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,274,432,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11847/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,274,624,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11848/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,274,816,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11849/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,275,008,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11850/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,275,200,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11851/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,275,392,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11852/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,275,584,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0470
+[step=11853/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,275,776,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11854/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,275,968,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11855/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,276,160,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11856/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,276,352,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11857/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,276,544,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11858/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,276,736,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11859/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,276,928,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11860/500000]
+ optim/total_grad_norm=0.8520
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,277,120,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11861/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,277,312,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11862/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,277,504,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11863/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=2,277,696,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11864/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=2,277,888,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11865/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,278,080,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11866/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,278,272,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11867/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,278,464,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11868/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,278,656,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11869/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,278,848,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11870/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,279,040,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11871/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,279,232,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11872/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,279,424,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11873/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,279,616,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11874/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,279,808,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11875/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=2,280,000,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11876/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,280,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11877/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,280,384,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11878/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,280,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11879/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,280,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11880/500000]
+ optim/total_grad_norm=0.8356
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,280,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11881/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,281,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11882/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,281,344,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11883/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,281,536,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11884/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,281,728,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11885/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,281,920,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11886/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,282,112,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11887/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,282,304,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11888/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,282,496,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11889/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,282,688,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11890/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,282,880,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11891/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,283,072,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11892/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,283,264,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11893/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=2,283,456,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11894/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,283,648,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11895/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,283,840,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11896/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=2,284,032,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11897/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,284,224,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11898/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,284,416,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11899/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,284,608,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11900/500000]
+ optim/total_grad_norm=0.7039
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,284,800,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11901/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,284,992,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11902/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=2,285,184,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11903/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,285,376,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11904/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,285,568,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11905/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,285,760,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11906/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,285,952,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11907/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,286,144,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11908/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,286,336,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11909/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,286,528,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11910/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,286,720,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11911/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,286,912,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11912/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,287,104,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11913/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,287,296,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11914/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,287,488,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11915/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,287,680,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=11916/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,287,872,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11917/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,288,064,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11918/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,288,256,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11919/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,288,448,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=11920/500000]
+ optim/total_grad_norm=0.6873
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,288,640,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11921/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,288,832,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11922/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,289,024,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11923/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,289,216,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11924/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,289,408,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11925/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,289,600,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11926/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,289,792,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11927/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,289,984,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11928/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,290,176,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11929/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,290,368,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11930/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,290,560,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11931/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,290,752,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11932/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,290,944,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11933/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,291,136,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11934/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,291,328,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11935/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,291,520,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11936/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,291,712,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11937/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,291,904,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11938/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,292,096,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11939/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,292,288,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11940/500000]
+ optim/total_grad_norm=0.7939
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,292,480,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11941/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,292,672,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11942/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,292,864,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11943/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,293,056,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11944/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,293,248,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=11945/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,293,440,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11946/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,293,632,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11947/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,293,824,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11948/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,294,016,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11949/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,294,208,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11950/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,294,400,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11951/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,294,592,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11952/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,294,784,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11953/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,294,976,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11954/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,295,168,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11955/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,295,360,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11956/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,295,552,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11957/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,295,744,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11958/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,295,936,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11959/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,296,128,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11960/500000]
+ optim/total_grad_norm=0.9155
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,296,320,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+ System/Peak GPU Memory (MB)=44,437
+[step=11961/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,296,512,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11962/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,296,704,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11963/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,296,896,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11964/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,297,088,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11965/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=2,297,280,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11966/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,297,472,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11967/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,297,664,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11968/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,297,856,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11969/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=2,298,048,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=11970/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,298,240,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=44,437
+[step=11971/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,298,432,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11972/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,298,624,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11973/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,298,816,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11974/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,299,008,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11975/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,299,200,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11976/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,299,392,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=11977/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,299,584,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11978/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,299,776,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11979/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,299,968,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11980/500000]
+ optim/total_grad_norm=0.9258
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,300,160,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=44,437
+[step=11981/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,300,352,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11982/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,300,544,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11983/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,300,736,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11984/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,300,928,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=11985/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,301,120,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/requirements.txt b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..d591dba0016b7c501858d0d2d84d7b27acfff58c
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/requirements.txt
@@ -0,0 +1,285 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+tensorflow-rocm==2.16.2
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/wandb-metadata.json b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..9b8917aee0d4874c0427e3388a886d41e8b08abe
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-24T08:24:16.439204Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "c13f2763af61e0d729a8b5ab4bdefc512205bcc5"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-311",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50233278464"
+ }
+ },
+ "memory": {
+ "total": "2434606952448"
+ },
+ "gpu_amd": [
+ {
+ "id": "1",
+ "uniqueId": "0xfc6ffa890311d155",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x3c6dd21e6c9dcdcd",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x42899199aa6191e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xd4b6b7007198f17b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x43c043ea6952a445",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x6770855728ded71b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xeb2d43fc31d036dc",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xf6d46069b47c33f6",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1758961395",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1623",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-311",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1758702195",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1623",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-311",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "3323380",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-311",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "t1ahnsccez1z37lkaaofi96iryft2eo9"
+}
\ No newline at end of file
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-core.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..6bf2ddc53af9e1d0a24bc18dd31c7c303fa53329
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-09-24T08:24:16.660480914Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp53wcxeju/port-3323461.txt","pid":3323461,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-24T08:24:16.662271854Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3323461}
+{"time":"2025-09-24T08:24:16.662230713Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3323461-3323638-1579542534/socket","Net":"unix"}}
+{"time":"2025-09-24T08:24:16.694281303Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-24T08:24:16.703433882Z","level":"INFO","msg":"handleInformInit: received","streamId":"4dp69fok","id":"1(@)"}
+{"time":"2025-09-24T08:24:17.754484882Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"4dp69fok","id":"1(@)"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-internal.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..e84c27228092453f22934b1211aa4706f57edff5
--- /dev/null
+++ b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug-internal.log
@@ -0,0 +1,13 @@
+{"time":"2025-09-24T08:24:16.705237241Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-24T08:24:17.754431561Z","level":"INFO","msg":"stream: created new stream","id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754478082Z","level":"INFO","msg":"stream: started","id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754498402Z","level":"INFO","msg":"sender: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754506202Z","level":"INFO","msg":"writer: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T08:24:17.754546793Z","level":"INFO","msg":"handler: started","stream_id":"4dp69fok"}
+{"time":"2025-09-24T15:15:45.267501791Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-24T20:24:27.534186056Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-25T23:01:28.093149981Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-26T02:33:15.940926228Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/4dp69fok/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-09-26T19:36:48.428667728Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/4dp69fok/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-09-26T20:06:50.687851553Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-09-26T20:59:26.86775551Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
diff --git a/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug.log b/all_flow_matching/glue_best/wandb/wandb/run-20250924_082416-4dp69fok/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/step11500-action-head/metadata.pt b/all_flow_matching/step11500-action-head/metadata.pt
new file mode 100644
index 0000000000000000000000000000000000000000..4e34304d65d6217c2b0a33ee0a75ccecc5e8f82c
--- /dev/null
+++ b/all_flow_matching/step11500-action-head/metadata.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7fb72b6306ce04d1beb20bb289509f00c39a40845ff7c4b36bf4deb4e83fe82a
+size 1331
diff --git a/all_flow_matching/step12000-action-head/metadata.pt b/all_flow_matching/step12000-action-head/metadata.pt
new file mode 100644
index 0000000000000000000000000000000000000000..752c8b547c4cac7f78746ac5066032167b1cf3c1
--- /dev/null
+++ b/all_flow_matching/step12000-action-head/metadata.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:995307502120af3866f237cd0bc484fc848a652539d28e53cbea882abc16ba6b
+size 1331
diff --git a/all_flow_matching/step12000-unsharded/config.yaml b/all_flow_matching/step12000-unsharded/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..fc3198c411bd4cea3c4ae243f476aad3f5428d98
--- /dev/null
+++ b/all_flow_matching/step12000-unsharded/config.yaml
@@ -0,0 +1,322 @@
+run_name: all_20251002_164508
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/all_flow_matching
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: all_20251002_164508
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/all_flow_matching/step12000-unsharded/lora.pt b/all_flow_matching/step12000-unsharded/lora.pt
new file mode 100644
index 0000000000000000000000000000000000000000..d3eb8fc48e155d8229340760896a20ba9fc413e2
--- /dev/null
+++ b/all_flow_matching/step12000-unsharded/lora.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b09055f15a54dd092b4dd30833406731057005822da0c55c16231cf2e68f7f6
+size 1243
diff --git a/all_flow_matching/step12000-unsharded/train.pt b/all_flow_matching/step12000-unsharded/train.pt
new file mode 100644
index 0000000000000000000000000000000000000000..579d4bb116ed7276b99d526ba8c4edf08dd60e1e
--- /dev/null
+++ b/all_flow_matching/step12000-unsharded/train.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0675538ed663c987b6011099fdfd14d35634f2eafa70e09c30e2c1d93e3b6e21
+size 15061
diff --git a/all_flow_matching/step12000/config.yaml b/all_flow_matching/step12000/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..fc3198c411bd4cea3c4ae243f476aad3f5428d98
--- /dev/null
+++ b/all_flow_matching/step12000/config.yaml
@@ -0,0 +1,322 @@
+run_name: all_20251002_164508
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/all_flow_matching
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: all_20251002_164508
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/all_flow_matching/wandb/wandb/debug-internal.log b/all_flow_matching/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..46bb34f26df4f2aeb63b46b2f2a8239758de40aa
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/debug-internal.log
@@ -0,0 +1,8 @@
+{"time":"2025-10-02T16:45:38.466053735Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:45:39.489216309Z","level":"INFO","msg":"stream: created new stream","id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48927263Z","level":"INFO","msg":"stream: started","id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48928615Z","level":"INFO","msg":"writer: started","stream_id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48930321Z","level":"INFO","msg":"sender: started","stream_id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.489330791Z","level":"INFO","msg":"handler: started","stream_id":"si5wp17t"}
+{"time":"2025-10-03T17:19:10.628180203Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/si5wp17t/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-10-04T16:32:25.479544416Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
diff --git a/all_flow_matching/wandb/wandb/debug.log b/all_flow_matching/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/output.log b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..e2e92787d291a57ae5c6e244745d637d4c8644e4
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/output.log
@@ -0,0 +1,25784 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+09/28 [10:46:57] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_StickyNote', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Test_Glue', 0.1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe', 0.1, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 0.1, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 0.1, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+09/28 [10:47:04] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:128
+09/28 [10:47:05] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk
+Downloading data: 100%|██████████| 109/109 [00:00<00:00, 21695.02files/s]
+Generating train split: 72641 examples [00:44, 1628.53 examples/s]
+****** length of the dataset: 72641
+09/28 [10:47:58] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50
+****** length of the dataset: 27906
+09/28 [10:48:22] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser
+****** length of the dataset: 13441
+09/28 [10:48:37] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+09/28 [10:48:48] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen
+****** length of the dataset: 17131
+09/28 [10:49:03] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_StickyNote
+****** length of the dataset: 15765
+09/28 [10:49:18] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Test_Glue
+****** length of the dataset: 90
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:434
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe
+****** length of the dataset: 18397
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: [, , , , , , , ]
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+09/28 [10:49:38] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=True, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Add lora to model.transformer successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* get lora params name: llm_params[0]: blocks.18._fsdp_wrapped_module.ff_proj.parametrizations.weight.0.lora_B
+************* After get lora params successfully
+09/28 [10:51:11] INFO | >> Constructing optimizer with 1 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 39071
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=39,071
+09/28 [10:51:12] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+09/28 [10:51:19] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.754
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=43,919
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.721
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=44,538
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.817
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.829
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.685
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.671
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.799
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=8/500000]
+ train/ActionNoiseL2Loss=1.743
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=9/500000]
+ train/ActionNoiseL2Loss=1.619
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=10/500000]
+ train/ActionNoiseL2Loss=1.587
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=11/500000]
+ train/ActionNoiseL2Loss=1.592
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=12/500000]
+ train/ActionNoiseL2Loss=1.625
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=13/500000]
+ train/ActionNoiseL2Loss=1.467
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=14/500000]
+ train/ActionNoiseL2Loss=1.567
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=15/500000]
+ train/ActionNoiseL2Loss=1.523
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=16/500000]
+ train/ActionNoiseL2Loss=1.647
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=17/500000]
+ train/ActionNoiseL2Loss=1.480
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=18/500000]
+ train/ActionNoiseL2Loss=1.561
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=19/500000]
+ train/ActionNoiseL2Loss=1.405
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=20/500000]
+ optim/total_grad_norm=18.02
+ train/ActionNoiseL2Loss=1.467
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,538
+[step=21/500000]
+ train/ActionNoiseL2Loss=1.575
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=22/500000]
+ train/ActionNoiseL2Loss=1.415
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=23/500000]
+ train/ActionNoiseL2Loss=1.389
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=24/500000]
+ train/ActionNoiseL2Loss=1.531
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=25/500000]
+ train/ActionNoiseL2Loss=1.371
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=26/500000]
+ train/ActionNoiseL2Loss=1.460
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=27/500000]
+ train/ActionNoiseL2Loss=1.547
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=28/500000]
+ train/ActionNoiseL2Loss=1.504
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=29/500000]
+ train/ActionNoiseL2Loss=1.567
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=30/500000]
+ train/ActionNoiseL2Loss=1.364
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=31/500000]
+ train/ActionNoiseL2Loss=1.428
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=32/500000]
+ train/ActionNoiseL2Loss=1.268
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=33/500000]
+ train/ActionNoiseL2Loss=1.406
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=34/500000]
+ train/ActionNoiseL2Loss=1.427
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=35/500000]
+ train/ActionNoiseL2Loss=1.308
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=36/500000]
+ train/ActionNoiseL2Loss=1.398
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=37/500000]
+ train/ActionNoiseL2Loss=1.248
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=38/500000]
+ train/ActionNoiseL2Loss=1.287
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=39/500000]
+ train/ActionNoiseL2Loss=1.352
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=40/500000]
+ optim/total_grad_norm=11.81
+ train/ActionNoiseL2Loss=1.244
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=41/500000]
+ train/ActionNoiseL2Loss=1.223
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=42/500000]
+ train/ActionNoiseL2Loss=1.257
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=43/500000]
+ train/ActionNoiseL2Loss=1.378
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=44/500000]
+ train/ActionNoiseL2Loss=1.444
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=45/500000]
+ train/ActionNoiseL2Loss=1.242
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=46/500000]
+ train/ActionNoiseL2Loss=1.213
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=47/500000]
+ train/ActionNoiseL2Loss=1.226
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=48/500000]
+ train/ActionNoiseL2Loss=1.227
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=49/500000]
+ train/ActionNoiseL2Loss=1.156
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=50/500000]
+ train/ActionNoiseL2Loss=1.232
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=51/500000]
+ train/ActionNoiseL2Loss=1.206
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=52/500000]
+ train/ActionNoiseL2Loss=1.174
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=53/500000]
+ train/ActionNoiseL2Loss=1.231
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=54/500000]
+ train/ActionNoiseL2Loss=1.217
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=55/500000]
+ train/ActionNoiseL2Loss=1.120
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=56/500000]
+ train/ActionNoiseL2Loss=1.189
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=57/500000]
+ train/ActionNoiseL2Loss=1.202
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=58/500000]
+ train/ActionNoiseL2Loss=1.174
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=59/500000]
+ train/ActionNoiseL2Loss=1.137
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=60/500000]
+ optim/total_grad_norm=15.05
+ train/ActionNoiseL2Loss=1.154
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=61/500000]
+ train/ActionNoiseL2Loss=1.171
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=62/500000]
+ train/ActionNoiseL2Loss=1.136
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=63/500000]
+ train/ActionNoiseL2Loss=1.069
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=64/500000]
+ train/ActionNoiseL2Loss=1.018
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=65/500000]
+ train/ActionNoiseL2Loss=1.148
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=66/500000]
+ train/ActionNoiseL2Loss=1.122
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=67/500000]
+ train/ActionNoiseL2Loss=1.061
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=68/500000]
+ train/ActionNoiseL2Loss=1.180
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=69/500000]
+ train/ActionNoiseL2Loss=1.076
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=70/500000]
+ train/ActionNoiseL2Loss=0.9982
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=71/500000]
+ train/ActionNoiseL2Loss=1.056
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=72/500000]
+ train/ActionNoiseL2Loss=0.9978
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=73/500000]
+ train/ActionNoiseL2Loss=1.048
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=74/500000]
+ train/ActionNoiseL2Loss=1.049
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=75/500000]
+ train/ActionNoiseL2Loss=1.006
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=76/500000]
+ train/ActionNoiseL2Loss=0.9742
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=77/500000]
+ train/ActionNoiseL2Loss=0.9389
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=78/500000]
+ train/ActionNoiseL2Loss=1.040
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=79/500000]
+ train/ActionNoiseL2Loss=1.148
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=80/500000]
+ optim/total_grad_norm=12.96
+ train/ActionNoiseL2Loss=0.9517
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=81/500000]
+ train/ActionNoiseL2Loss=1.162
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=82/500000]
+ train/ActionNoiseL2Loss=1.051
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=83/500000]
+ train/ActionNoiseL2Loss=1.100
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=84/500000]
+ train/ActionNoiseL2Loss=1.114
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=85/500000]
+ train/ActionNoiseL2Loss=1.183
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=86/500000]
+ train/ActionNoiseL2Loss=0.9630
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=87/500000]
+ train/ActionNoiseL2Loss=1.010
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=88/500000]
+ train/ActionNoiseL2Loss=0.9832
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=89/500000]
+ train/ActionNoiseL2Loss=1.098
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=90/500000]
+ train/ActionNoiseL2Loss=0.8765
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=91/500000]
+ train/ActionNoiseL2Loss=1.018
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=92/500000]
+ train/ActionNoiseL2Loss=0.9873
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=93/500000]
+ train/ActionNoiseL2Loss=0.9625
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=94/500000]
+ train/ActionNoiseL2Loss=0.9012
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=95/500000]
+ train/ActionNoiseL2Loss=0.9873
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=96/500000]
+ train/ActionNoiseL2Loss=0.9873
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=97/500000]
+ train/ActionNoiseL2Loss=0.8499
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=98/500000]
+ train/ActionNoiseL2Loss=1.144
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=99/500000]
+ train/ActionNoiseL2Loss=0.8784
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=100/500000]
+ optim/total_grad_norm=13.28
+ train/ActionNoiseL2Loss=0.9532
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=101/500000]
+ train/ActionNoiseL2Loss=0.9440
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=102/500000]
+ train/ActionNoiseL2Loss=0.9241
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=103/500000]
+ train/ActionNoiseL2Loss=0.8683
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=104/500000]
+ train/ActionNoiseL2Loss=0.9848
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=105/500000]
+ train/ActionNoiseL2Loss=1.025
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=106/500000]
+ train/ActionNoiseL2Loss=0.9704
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=107/500000]
+ train/ActionNoiseL2Loss=0.9373
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=108/500000]
+ train/ActionNoiseL2Loss=1.023
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=109/500000]
+ train/ActionNoiseL2Loss=0.8805
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=110/500000]
+ train/ActionNoiseL2Loss=0.7717
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=111/500000]
+ train/ActionNoiseL2Loss=0.8106
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=112/500000]
+ train/ActionNoiseL2Loss=1.012
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=113/500000]
+ train/ActionNoiseL2Loss=0.9313
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=114/500000]
+ train/ActionNoiseL2Loss=1.011
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=115/500000]
+ train/ActionNoiseL2Loss=1.005
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=116/500000]
+ train/ActionNoiseL2Loss=0.8261
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=117/500000]
+ train/ActionNoiseL2Loss=0.9501
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=118/500000]
+ train/ActionNoiseL2Loss=1.062
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=119/500000]
+ train/ActionNoiseL2Loss=0.8693
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=120/500000]
+ optim/total_grad_norm=17.84
+ train/ActionNoiseL2Loss=1.039
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=121/500000]
+ train/ActionNoiseL2Loss=0.8773
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=122/500000]
+ train/ActionNoiseL2Loss=1.014
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=123/500000]
+ train/ActionNoiseL2Loss=0.9666
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=124/500000]
+ train/ActionNoiseL2Loss=0.9646
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=125/500000]
+ train/ActionNoiseL2Loss=0.8647
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=126/500000]
+ train/ActionNoiseL2Loss=0.9192
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=127/500000]
+ train/ActionNoiseL2Loss=0.8185
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=128/500000]
+ train/ActionNoiseL2Loss=1.172
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=129/500000]
+ train/ActionNoiseL2Loss=0.9160
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=130/500000]
+ train/ActionNoiseL2Loss=0.8064
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=131/500000]
+ train/ActionNoiseL2Loss=1.085
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=132/500000]
+ train/ActionNoiseL2Loss=0.8301
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=133/500000]
+ train/ActionNoiseL2Loss=1.033
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=134/500000]
+ train/ActionNoiseL2Loss=0.9440
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=135/500000]
+ train/ActionNoiseL2Loss=0.9074
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=136/500000]
+ train/ActionNoiseL2Loss=0.8927
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=137/500000]
+ train/ActionNoiseL2Loss=0.9290
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=138/500000]
+ train/ActionNoiseL2Loss=0.8975
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=139/500000]
+ train/ActionNoiseL2Loss=0.7815
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=140/500000]
+ optim/total_grad_norm=12.60
+ train/ActionNoiseL2Loss=0.9791
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=141/500000]
+ train/ActionNoiseL2Loss=0.7799
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=142/500000]
+ train/ActionNoiseL2Loss=0.8617
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=143/500000]
+ train/ActionNoiseL2Loss=0.9488
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=144/500000]
+ train/ActionNoiseL2Loss=0.9250
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=145/500000]
+ train/ActionNoiseL2Loss=1.036
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=146/500000]
+ train/ActionNoiseL2Loss=0.8911
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=147/500000]
+ train/ActionNoiseL2Loss=0.8062
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=148/500000]
+ train/ActionNoiseL2Loss=0.8709
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=149/500000]
+ train/ActionNoiseL2Loss=0.8187
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=150/500000]
+ train/ActionNoiseL2Loss=0.7815
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=151/500000]
+ train/ActionNoiseL2Loss=0.8030
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=152/500000]
+ train/ActionNoiseL2Loss=0.8464
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=153/500000]
+ train/ActionNoiseL2Loss=0.8272
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=154/500000]
+ train/ActionNoiseL2Loss=0.9214
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=155/500000]
+ train/ActionNoiseL2Loss=0.9015
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=156/500000]
+ train/ActionNoiseL2Loss=0.8983
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=157/500000]
+ train/ActionNoiseL2Loss=1.002
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=158/500000]
+ train/ActionNoiseL2Loss=0.7627
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=159/500000]
+ train/ActionNoiseL2Loss=0.8012
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=160/500000]
+ optim/total_grad_norm=13.08
+ train/ActionNoiseL2Loss=0.8558
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=161/500000]
+ train/ActionNoiseL2Loss=0.8068
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=162/500000]
+ train/ActionNoiseL2Loss=0.8921
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=163/500000]
+ train/ActionNoiseL2Loss=0.8412
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=164/500000]
+ train/ActionNoiseL2Loss=0.9908
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=165/500000]
+ train/ActionNoiseL2Loss=0.8452
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=166/500000]
+ train/ActionNoiseL2Loss=0.8796
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=167/500000]
+ train/ActionNoiseL2Loss=0.8352
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=168/500000]
+ train/ActionNoiseL2Loss=0.8859
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=169/500000]
+ train/ActionNoiseL2Loss=0.8173
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=170/500000]
+ train/ActionNoiseL2Loss=0.8411
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=171/500000]
+ train/ActionNoiseL2Loss=0.8269
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=172/500000]
+ train/ActionNoiseL2Loss=0.6627
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=173/500000]
+ train/ActionNoiseL2Loss=0.7728
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=174/500000]
+ train/ActionNoiseL2Loss=0.8470
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=175/500000]
+ train/ActionNoiseL2Loss=0.9638
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=176/500000]
+ train/ActionNoiseL2Loss=0.7728
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=177/500000]
+ train/ActionNoiseL2Loss=0.8040
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=178/500000]
+ train/ActionNoiseL2Loss=0.9564
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=179/500000]
+ train/ActionNoiseL2Loss=0.7940
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=180/500000]
+ optim/total_grad_norm=10.42
+ train/ActionNoiseL2Loss=0.7037
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=181/500000]
+ train/ActionNoiseL2Loss=0.7450
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=182/500000]
+ train/ActionNoiseL2Loss=0.8312
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=183/500000]
+ train/ActionNoiseL2Loss=0.8820
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=184/500000]
+ train/ActionNoiseL2Loss=0.8560
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=185/500000]
+ train/ActionNoiseL2Loss=0.7487
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=186/500000]
+ train/ActionNoiseL2Loss=0.7105
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=187/500000]
+ train/ActionNoiseL2Loss=0.7155
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=188/500000]
+ train/ActionNoiseL2Loss=0.7235
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=189/500000]
+ train/ActionNoiseL2Loss=0.9406
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=190/500000]
+ train/ActionNoiseL2Loss=0.8124
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=191/500000]
+ train/ActionNoiseL2Loss=0.8098
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=192/500000]
+ train/ActionNoiseL2Loss=0.8286
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=193/500000]
+ train/ActionNoiseL2Loss=0.7590
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=194/500000]
+ train/ActionNoiseL2Loss=0.9254
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=195/500000]
+ train/ActionNoiseL2Loss=0.9061
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=196/500000]
+ train/ActionNoiseL2Loss=0.7591
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=197/500000]
+ train/ActionNoiseL2Loss=0.7776
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=198/500000]
+ train/ActionNoiseL2Loss=0.7689
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=199/500000]
+ train/ActionNoiseL2Loss=0.7935
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=200/500000]
+ optim/total_grad_norm=31.32
+ train/ActionNoiseL2Loss=0.8211
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=201/500000]
+ train/ActionNoiseL2Loss=0.8033
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=202/500000]
+ train/ActionNoiseL2Loss=0.8782
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=203/500000]
+ train/ActionNoiseL2Loss=0.7554
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=204/500000]
+ train/ActionNoiseL2Loss=0.7406
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=205/500000]
+ train/ActionNoiseL2Loss=0.7410
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=206/500000]
+ train/ActionNoiseL2Loss=0.7674
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=207/500000]
+ train/ActionNoiseL2Loss=0.9770
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=208/500000]
+ train/ActionNoiseL2Loss=0.8240
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=209/500000]
+ train/ActionNoiseL2Loss=0.7339
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=210/500000]
+ train/ActionNoiseL2Loss=0.7460
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,538
+[step=211/500000]
+ train/ActionNoiseL2Loss=0.7627
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=212/500000]
+ train/ActionNoiseL2Loss=0.6886
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=213/500000]
+ train/ActionNoiseL2Loss=0.6372
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=214/500000]
+ train/ActionNoiseL2Loss=0.5400
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=215/500000]
+ train/ActionNoiseL2Loss=0.7742
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=216/500000]
+ train/ActionNoiseL2Loss=0.8200
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=217/500000]
+ train/ActionNoiseL2Loss=0.7195
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=218/500000]
+ train/ActionNoiseL2Loss=0.7733
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=219/500000]
+ train/ActionNoiseL2Loss=0.7435
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=220/500000]
+ optim/total_grad_norm=17.02
+ train/ActionNoiseL2Loss=0.8552
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=221/500000]
+ train/ActionNoiseL2Loss=0.6981
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=222/500000]
+ train/ActionNoiseL2Loss=0.6329
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=223/500000]
+ train/ActionNoiseL2Loss=0.6483
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=224/500000]
+ train/ActionNoiseL2Loss=0.5920
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=225/500000]
+ train/ActionNoiseL2Loss=0.6834
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=226/500000]
+ train/ActionNoiseL2Loss=0.8477
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=227/500000]
+ train/ActionNoiseL2Loss=0.7836
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=228/500000]
+ train/ActionNoiseL2Loss=0.7721
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=229/500000]
+ train/ActionNoiseL2Loss=0.9040
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=230/500000]
+ train/ActionNoiseL2Loss=0.6665
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=231/500000]
+ train/ActionNoiseL2Loss=0.7095
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=232/500000]
+ train/ActionNoiseL2Loss=0.7321
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=233/500000]
+ train/ActionNoiseL2Loss=0.6439
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=234/500000]
+ train/ActionNoiseL2Loss=0.7442
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=235/500000]
+ train/ActionNoiseL2Loss=0.8174
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=236/500000]
+ train/ActionNoiseL2Loss=0.6767
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=237/500000]
+ train/ActionNoiseL2Loss=0.6855
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=238/500000]
+ train/ActionNoiseL2Loss=0.6094
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=239/500000]
+ train/ActionNoiseL2Loss=0.5974
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=240/500000]
+ optim/total_grad_norm=15.71
+ train/ActionNoiseL2Loss=0.6939
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=241/500000]
+ train/ActionNoiseL2Loss=0.6481
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=242/500000]
+ train/ActionNoiseL2Loss=0.6972
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=243/500000]
+ train/ActionNoiseL2Loss=0.6074
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=244/500000]
+ train/ActionNoiseL2Loss=0.6945
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=245/500000]
+ train/ActionNoiseL2Loss=0.7140
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=246/500000]
+ train/ActionNoiseL2Loss=0.6482
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=247/500000]
+ train/ActionNoiseL2Loss=0.7216
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=248/500000]
+ train/ActionNoiseL2Loss=0.8001
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=249/500000]
+ train/ActionNoiseL2Loss=0.7049
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=250/500000]
+ train/ActionNoiseL2Loss=0.6543
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=251/500000]
+ train/ActionNoiseL2Loss=0.5755
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=252/500000]
+ train/ActionNoiseL2Loss=0.5681
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=253/500000]
+ train/ActionNoiseL2Loss=0.6114
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=254/500000]
+ train/ActionNoiseL2Loss=0.5433
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=255/500000]
+ train/ActionNoiseL2Loss=0.4787
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=256/500000]
+ train/ActionNoiseL2Loss=0.6423
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=257/500000]
+ train/ActionNoiseL2Loss=0.5736
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=258/500000]
+ train/ActionNoiseL2Loss=0.5757
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=259/500000]
+ train/ActionNoiseL2Loss=0.6543
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=260/500000]
+ optim/total_grad_norm=15.90
+ train/ActionNoiseL2Loss=0.7440
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=261/500000]
+ train/ActionNoiseL2Loss=0.5196
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=262/500000]
+ train/ActionNoiseL2Loss=0.5877
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=263/500000]
+ train/ActionNoiseL2Loss=0.5693
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=264/500000]
+ train/ActionNoiseL2Loss=0.5388
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=265/500000]
+ train/ActionNoiseL2Loss=0.6032
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=266/500000]
+ train/ActionNoiseL2Loss=0.5574
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=267/500000]
+ train/ActionNoiseL2Loss=0.5675
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=268/500000]
+ train/ActionNoiseL2Loss=0.5242
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=269/500000]
+ train/ActionNoiseL2Loss=0.6309
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=270/500000]
+ train/ActionNoiseL2Loss=0.6047
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=271/500000]
+ train/ActionNoiseL2Loss=0.6273
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=272/500000]
+ train/ActionNoiseL2Loss=0.6132
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=273/500000]
+ train/ActionNoiseL2Loss=0.4889
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=274/500000]
+ train/ActionNoiseL2Loss=0.5722
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=275/500000]
+ train/ActionNoiseL2Loss=0.4977
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=276/500000]
+ train/ActionNoiseL2Loss=0.5368
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=277/500000]
+ train/ActionNoiseL2Loss=0.5937
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=278/500000]
+ train/ActionNoiseL2Loss=0.6018
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=279/500000]
+ train/ActionNoiseL2Loss=0.5590
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=280/500000]
+ optim/total_grad_norm=13.25
+ train/ActionNoiseL2Loss=0.5959
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=281/500000]
+ train/ActionNoiseL2Loss=0.5487
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=282/500000]
+ train/ActionNoiseL2Loss=0.6261
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=283/500000]
+ train/ActionNoiseL2Loss=0.4730
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=284/500000]
+ train/ActionNoiseL2Loss=0.4971
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=285/500000]
+ train/ActionNoiseL2Loss=0.4252
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=286/500000]
+ train/ActionNoiseL2Loss=0.5345
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=287/500000]
+ train/ActionNoiseL2Loss=0.6434
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=288/500000]
+ train/ActionNoiseL2Loss=0.6090
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=289/500000]
+ train/ActionNoiseL2Loss=0.6755
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=290/500000]
+ train/ActionNoiseL2Loss=0.5945
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=291/500000]
+ train/ActionNoiseL2Loss=0.5015
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=292/500000]
+ train/ActionNoiseL2Loss=0.4377
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=293/500000]
+ train/ActionNoiseL2Loss=0.4649
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=294/500000]
+ train/ActionNoiseL2Loss=0.3879
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=295/500000]
+ train/ActionNoiseL2Loss=0.3933
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=296/500000]
+ train/ActionNoiseL2Loss=0.4337
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=297/500000]
+ train/ActionNoiseL2Loss=0.5369
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=298/500000]
+ train/ActionNoiseL2Loss=0.5134
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=299/500000]
+ train/ActionNoiseL2Loss=0.4198
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=300/500000]
+ optim/total_grad_norm=16.60
+ train/ActionNoiseL2Loss=0.6567
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=301/500000]
+ train/ActionNoiseL2Loss=0.4723
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=302/500000]
+ train/ActionNoiseL2Loss=0.4517
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=303/500000]
+ train/ActionNoiseL2Loss=0.3371
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=304/500000]
+ train/ActionNoiseL2Loss=0.4962
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=305/500000]
+ train/ActionNoiseL2Loss=0.5007
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=306/500000]
+ train/ActionNoiseL2Loss=0.5200
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=307/500000]
+ train/ActionNoiseL2Loss=0.5558
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=308/500000]
+ train/ActionNoiseL2Loss=0.4949
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=309/500000]
+ train/ActionNoiseL2Loss=0.4176
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=310/500000]
+ train/ActionNoiseL2Loss=0.4637
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=311/500000]
+ train/ActionNoiseL2Loss=0.4465
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=312/500000]
+ train/ActionNoiseL2Loss=0.3855
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=313/500000]
+ train/ActionNoiseL2Loss=0.4994
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=314/500000]
+ train/ActionNoiseL2Loss=0.4003
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=315/500000]
+ train/ActionNoiseL2Loss=0.3789
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=316/500000]
+ train/ActionNoiseL2Loss=0.4288
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=317/500000]
+ train/ActionNoiseL2Loss=0.3468
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=318/500000]
+ train/ActionNoiseL2Loss=0.4258
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=319/500000]
+ train/ActionNoiseL2Loss=0.4437
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=320/500000]
+ optim/total_grad_norm=10.41
+ train/ActionNoiseL2Loss=0.3239
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=321/500000]
+ train/ActionNoiseL2Loss=0.4448
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=322/500000]
+ train/ActionNoiseL2Loss=0.5381
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=323/500000]
+ train/ActionNoiseL2Loss=0.5212
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=324/500000]
+ train/ActionNoiseL2Loss=0.4197
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=325/500000]
+ train/ActionNoiseL2Loss=0.6209
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=326/500000]
+ train/ActionNoiseL2Loss=0.4660
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=327/500000]
+ train/ActionNoiseL2Loss=0.4564
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=328/500000]
+ train/ActionNoiseL2Loss=0.4279
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=329/500000]
+ train/ActionNoiseL2Loss=0.4283
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=330/500000]
+ train/ActionNoiseL2Loss=0.5978
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=331/500000]
+ train/ActionNoiseL2Loss=0.4106
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=332/500000]
+ train/ActionNoiseL2Loss=0.4279
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=333/500000]
+ train/ActionNoiseL2Loss=0.3783
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=334/500000]
+ train/ActionNoiseL2Loss=0.4245
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=335/500000]
+ train/ActionNoiseL2Loss=0.3137
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=336/500000]
+ train/ActionNoiseL2Loss=0.3230
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=337/500000]
+ train/ActionNoiseL2Loss=0.4777
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=338/500000]
+ train/ActionNoiseL2Loss=0.6340
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=339/500000]
+ train/ActionNoiseL2Loss=0.6018
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=340/500000]
+ optim/total_grad_norm=13.52
+ train/ActionNoiseL2Loss=0.3224
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=341/500000]
+ train/ActionNoiseL2Loss=0.4713
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=342/500000]
+ train/ActionNoiseL2Loss=0.5232
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=343/500000]
+ train/ActionNoiseL2Loss=0.3912
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=344/500000]
+ train/ActionNoiseL2Loss=0.2949
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=345/500000]
+ train/ActionNoiseL2Loss=0.4340
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=346/500000]
+ train/ActionNoiseL2Loss=0.3657
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=347/500000]
+ train/ActionNoiseL2Loss=0.3272
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=348/500000]
+ train/ActionNoiseL2Loss=0.4544
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=349/500000]
+ train/ActionNoiseL2Loss=0.6187
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=350/500000]
+ train/ActionNoiseL2Loss=0.3868
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=351/500000]
+ train/ActionNoiseL2Loss=0.3791
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=352/500000]
+ train/ActionNoiseL2Loss=0.4713
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=353/500000]
+ train/ActionNoiseL2Loss=0.4811
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=354/500000]
+ train/ActionNoiseL2Loss=0.3299
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=355/500000]
+ train/ActionNoiseL2Loss=0.4993
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=356/500000]
+ train/ActionNoiseL2Loss=0.4383
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=357/500000]
+ train/ActionNoiseL2Loss=0.4703
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=358/500000]
+ train/ActionNoiseL2Loss=0.5352
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=359/500000]
+ train/ActionNoiseL2Loss=0.3142
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=360/500000]
+ optim/total_grad_norm=11.87
+ train/ActionNoiseL2Loss=0.3465
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=361/500000]
+ train/ActionNoiseL2Loss=0.3536
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=362/500000]
+ train/ActionNoiseL2Loss=0.5516
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=363/500000]
+ train/ActionNoiseL2Loss=0.4358
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=364/500000]
+ train/ActionNoiseL2Loss=0.4278
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=365/500000]
+ train/ActionNoiseL2Loss=0.3890
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=366/500000]
+ train/ActionNoiseL2Loss=0.3932
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=367/500000]
+ train/ActionNoiseL2Loss=0.4159
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=368/500000]
+ train/ActionNoiseL2Loss=0.4403
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=369/500000]
+ train/ActionNoiseL2Loss=0.3165
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=370/500000]
+ train/ActionNoiseL2Loss=0.4008
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=371/500000]
+ train/ActionNoiseL2Loss=0.3687
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=372/500000]
+ train/ActionNoiseL2Loss=0.2853
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=373/500000]
+ train/ActionNoiseL2Loss=0.3156
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=374/500000]
+ train/ActionNoiseL2Loss=0.4810
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=375/500000]
+ train/ActionNoiseL2Loss=0.4210
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=376/500000]
+ train/ActionNoiseL2Loss=0.4172
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=377/500000]
+ train/ActionNoiseL2Loss=0.4341
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=378/500000]
+ train/ActionNoiseL2Loss=0.3559
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=379/500000]
+ train/ActionNoiseL2Loss=0.3259
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=380/500000]
+ optim/total_grad_norm=12.36
+ train/ActionNoiseL2Loss=0.3781
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,538
+[step=381/500000]
+ train/ActionNoiseL2Loss=0.2838
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=382/500000]
+ train/ActionNoiseL2Loss=0.2930
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=383/500000]
+ train/ActionNoiseL2Loss=0.5354
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=384/500000]
+ train/ActionNoiseL2Loss=0.4324
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=385/500000]
+ train/ActionNoiseL2Loss=0.3336
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=386/500000]
+ train/ActionNoiseL2Loss=0.4120
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=387/500000]
+ train/ActionNoiseL2Loss=0.3020
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=388/500000]
+ train/ActionNoiseL2Loss=0.2934
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=389/500000]
+ train/ActionNoiseL2Loss=0.2988
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=390/500000]
+ train/ActionNoiseL2Loss=0.2285
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=391/500000]
+ train/ActionNoiseL2Loss=0.4665
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=392/500000]
+ train/ActionNoiseL2Loss=0.3858
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=393/500000]
+ train/ActionNoiseL2Loss=0.3895
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=394/500000]
+ train/ActionNoiseL2Loss=0.4657
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=395/500000]
+ train/ActionNoiseL2Loss=0.4194
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=396/500000]
+ train/ActionNoiseL2Loss=0.3076
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=397/500000]
+ train/ActionNoiseL2Loss=0.4248
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=398/500000]
+ train/ActionNoiseL2Loss=0.3083
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=399/500000]
+ train/ActionNoiseL2Loss=0.3726
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=400/500000]
+ optim/total_grad_norm=9.611
+ train/ActionNoiseL2Loss=0.3398
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=401/500000]
+ train/ActionNoiseL2Loss=0.2977
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=402/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=403/500000]
+ train/ActionNoiseL2Loss=0.2892
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=404/500000]
+ train/ActionNoiseL2Loss=0.3507
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=405/500000]
+ train/ActionNoiseL2Loss=0.2835
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=406/500000]
+ train/ActionNoiseL2Loss=0.2985
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=407/500000]
+ train/ActionNoiseL2Loss=0.3638
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=408/500000]
+ train/ActionNoiseL2Loss=0.2865
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=409/500000]
+ train/ActionNoiseL2Loss=0.3489
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=410/500000]
+ train/ActionNoiseL2Loss=0.4658
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=411/500000]
+ train/ActionNoiseL2Loss=0.3667
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=412/500000]
+ train/ActionNoiseL2Loss=0.4374
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=413/500000]
+ train/ActionNoiseL2Loss=0.3767
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=414/500000]
+ train/ActionNoiseL2Loss=0.3424
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=415/500000]
+ train/ActionNoiseL2Loss=0.3056
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=416/500000]
+ train/ActionNoiseL2Loss=0.4384
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=417/500000]
+ train/ActionNoiseL2Loss=0.3103
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=418/500000]
+ train/ActionNoiseL2Loss=0.2467
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=419/500000]
+ train/ActionNoiseL2Loss=0.3984
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=420/500000]
+ optim/total_grad_norm=9.753
+ train/ActionNoiseL2Loss=0.3935
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=421/500000]
+ train/ActionNoiseL2Loss=0.4430
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=422/500000]
+ train/ActionNoiseL2Loss=0.2854
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=423/500000]
+ train/ActionNoiseL2Loss=0.3305
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=424/500000]
+ train/ActionNoiseL2Loss=0.2324
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=425/500000]
+ train/ActionNoiseL2Loss=0.3971
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=426/500000]
+ train/ActionNoiseL2Loss=0.3199
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=427/500000]
+ train/ActionNoiseL2Loss=0.3133
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=428/500000]
+ train/ActionNoiseL2Loss=0.3207
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=429/500000]
+ train/ActionNoiseL2Loss=0.3267
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=430/500000]
+ train/ActionNoiseL2Loss=0.2374
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=431/500000]
+ train/ActionNoiseL2Loss=0.3198
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=432/500000]
+ train/ActionNoiseL2Loss=0.2796
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=433/500000]
+ train/ActionNoiseL2Loss=0.2846
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=434/500000]
+ train/ActionNoiseL2Loss=0.2340
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=435/500000]
+ train/ActionNoiseL2Loss=0.2615
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=436/500000]
+ train/ActionNoiseL2Loss=0.3175
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=437/500000]
+ train/ActionNoiseL2Loss=0.4548
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=438/500000]
+ train/ActionNoiseL2Loss=0.2971
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=439/500000]
+ train/ActionNoiseL2Loss=0.2830
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=440/500000]
+ optim/total_grad_norm=8.538
+ train/ActionNoiseL2Loss=0.2830
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=441/500000]
+ train/ActionNoiseL2Loss=0.2912
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=442/500000]
+ train/ActionNoiseL2Loss=0.3084
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=443/500000]
+ train/ActionNoiseL2Loss=0.3699
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=444/500000]
+ train/ActionNoiseL2Loss=0.3149
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=445/500000]
+ train/ActionNoiseL2Loss=0.3681
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=446/500000]
+ train/ActionNoiseL2Loss=0.2803
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=447/500000]
+ train/ActionNoiseL2Loss=0.3598
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=448/500000]
+ train/ActionNoiseL2Loss=0.3594
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=449/500000]
+ train/ActionNoiseL2Loss=0.3335
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=450/500000]
+ train/ActionNoiseL2Loss=0.2849
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=451/500000]
+ train/ActionNoiseL2Loss=0.3439
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=452/500000]
+ train/ActionNoiseL2Loss=0.3473
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=453/500000]
+ train/ActionNoiseL2Loss=0.3879
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=454/500000]
+ train/ActionNoiseL2Loss=0.2732
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=455/500000]
+ train/ActionNoiseL2Loss=0.4355
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=456/500000]
+ train/ActionNoiseL2Loss=0.4018
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=457/500000]
+ train/ActionNoiseL2Loss=0.3533
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=458/500000]
+ train/ActionNoiseL2Loss=0.3515
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=459/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=460/500000]
+ optim/total_grad_norm=10.51
+ train/ActionNoiseL2Loss=0.3686
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,538
+[step=461/500000]
+ train/ActionNoiseL2Loss=0.3390
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=462/500000]
+ train/ActionNoiseL2Loss=0.3693
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=463/500000]
+ train/ActionNoiseL2Loss=0.3094
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=464/500000]
+ train/ActionNoiseL2Loss=0.3452
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=465/500000]
+ train/ActionNoiseL2Loss=0.2234
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=466/500000]
+ train/ActionNoiseL2Loss=0.2093
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=467/500000]
+ train/ActionNoiseL2Loss=0.2759
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=468/500000]
+ train/ActionNoiseL2Loss=0.4306
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=469/500000]
+ train/ActionNoiseL2Loss=0.2630
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=470/500000]
+ train/ActionNoiseL2Loss=0.3560
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=471/500000]
+ train/ActionNoiseL2Loss=0.2218
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=472/500000]
+ train/ActionNoiseL2Loss=0.2368
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=473/500000]
+ train/ActionNoiseL2Loss=0.3178
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=474/500000]
+ train/ActionNoiseL2Loss=0.2741
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=475/500000]
+ train/ActionNoiseL2Loss=0.2124
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=476/500000]
+ train/ActionNoiseL2Loss=0.2653
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=477/500000]
+ train/ActionNoiseL2Loss=0.2934
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=478/500000]
+ train/ActionNoiseL2Loss=0.2190
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=479/500000]
+ train/ActionNoiseL2Loss=0.3514
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=480/500000]
+ optim/total_grad_norm=9.003
+ train/ActionNoiseL2Loss=0.2904
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=481/500000]
+ train/ActionNoiseL2Loss=0.3123
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=482/500000]
+ train/ActionNoiseL2Loss=0.2579
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=483/500000]
+ train/ActionNoiseL2Loss=0.3054
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=484/500000]
+ train/ActionNoiseL2Loss=0.2273
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=485/500000]
+ train/ActionNoiseL2Loss=0.2724
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=486/500000]
+ train/ActionNoiseL2Loss=0.2402
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=487/500000]
+ train/ActionNoiseL2Loss=0.2622
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=488/500000]
+ train/ActionNoiseL2Loss=0.2853
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=489/500000]
+ train/ActionNoiseL2Loss=0.2913
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=490/500000]
+ train/ActionNoiseL2Loss=0.2728
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+[step=491/500000]
+ train/ActionNoiseL2Loss=0.2351
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=492/500000]
+ train/ActionNoiseL2Loss=0.3187
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=493/500000]
+ train/ActionNoiseL2Loss=0.2703
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=494/500000]
+ train/ActionNoiseL2Loss=0.2841
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=495/500000]
+ train/ActionNoiseL2Loss=0.3328
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=496/500000]
+ train/ActionNoiseL2Loss=0.4015
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=497/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=498/500000]
+ train/ActionNoiseL2Loss=0.3198
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=499/500000]
+ train/ActionNoiseL2Loss=0.2495
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=500/500000]
+ optim/total_grad_norm=8.176
+ train/ActionNoiseL2Loss=0.2218
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,538
+09/28 [13:51:11] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+09/28 [13:51:14] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+09/28 [13:51:17] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+09/28 [13:51:33] INFO | >> Saving config... checkpoint.py:608
+09/28 [13:51:59] INFO | >> Saving model state... checkpoint.py:796
+09/28 [13:53:02] INFO | >> Saving optim state... checkpoint.py:811
+09/28 [13:53:06] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionNoiseL2Loss=0.3292
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=502/500000]
+ train/ActionNoiseL2Loss=0.2568
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=503/500000]
+ train/ActionNoiseL2Loss=0.3753
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=504/500000]
+ train/ActionNoiseL2Loss=0.4193
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,125
+ throughput/device/batches_per_second=0.0469
+[step=505/500000]
+ train/ActionNoiseL2Loss=0.3637
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=506/500000]
+ train/ActionNoiseL2Loss=0.2872
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=507/500000]
+ train/ActionNoiseL2Loss=0.2756
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=508/500000]
+ train/ActionNoiseL2Loss=0.2701
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=509/500000]
+ train/ActionNoiseL2Loss=0.3091
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=510/500000]
+ train/ActionNoiseL2Loss=0.3156
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,539
+[step=511/500000]
+ train/ActionNoiseL2Loss=0.3417
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=512/500000]
+ train/ActionNoiseL2Loss=0.3560
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=513/500000]
+ train/ActionNoiseL2Loss=0.3306
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=514/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=515/500000]
+ train/ActionNoiseL2Loss=0.3133
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=516/500000]
+ train/ActionNoiseL2Loss=0.2892
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=517/500000]
+ train/ActionNoiseL2Loss=0.2083
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=518/500000]
+ train/ActionNoiseL2Loss=0.2249
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=519/500000]
+ train/ActionNoiseL2Loss=0.4636
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=520/500000]
+ optim/total_grad_norm=9.939
+ train/ActionNoiseL2Loss=0.2560
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=521/500000]
+ train/ActionNoiseL2Loss=0.2706
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=522/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=523/500000]
+ train/ActionNoiseL2Loss=0.2690
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=524/500000]
+ train/ActionNoiseL2Loss=0.3758
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=525/500000]
+ train/ActionNoiseL2Loss=0.4230
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=526/500000]
+ train/ActionNoiseL2Loss=0.2491
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=527/500000]
+ train/ActionNoiseL2Loss=0.3528
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=528/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=529/500000]
+ train/ActionNoiseL2Loss=0.2365
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=530/500000]
+ train/ActionNoiseL2Loss=0.5582
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=531/500000]
+ train/ActionNoiseL2Loss=0.2694
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=532/500000]
+ train/ActionNoiseL2Loss=0.3639
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=533/500000]
+ train/ActionNoiseL2Loss=0.4570
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=534/500000]
+ train/ActionNoiseL2Loss=0.3114
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=535/500000]
+ train/ActionNoiseL2Loss=0.4325
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=536/500000]
+ train/ActionNoiseL2Loss=0.3453
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=537/500000]
+ train/ActionNoiseL2Loss=0.5251
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=538/500000]
+ train/ActionNoiseL2Loss=0.3858
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=539/500000]
+ train/ActionNoiseL2Loss=0.2192
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=540/500000]
+ optim/total_grad_norm=7.433
+ train/ActionNoiseL2Loss=0.2205
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=541/500000]
+ train/ActionNoiseL2Loss=0.2121
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=542/500000]
+ train/ActionNoiseL2Loss=0.2512
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=543/500000]
+ train/ActionNoiseL2Loss=0.2337
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=544/500000]
+ train/ActionNoiseL2Loss=0.2656
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=545/500000]
+ train/ActionNoiseL2Loss=0.2926
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=546/500000]
+ train/ActionNoiseL2Loss=0.2718
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=547/500000]
+ train/ActionNoiseL2Loss=0.1591
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=548/500000]
+ train/ActionNoiseL2Loss=0.2836
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=549/500000]
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=550/500000]
+ train/ActionNoiseL2Loss=0.2984
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=551/500000]
+ train/ActionNoiseL2Loss=0.2812
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=552/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=553/500000]
+ train/ActionNoiseL2Loss=0.2217
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=554/500000]
+ train/ActionNoiseL2Loss=0.3208
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=555/500000]
+ train/ActionNoiseL2Loss=0.4067
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=556/500000]
+ train/ActionNoiseL2Loss=0.2080
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=557/500000]
+ train/ActionNoiseL2Loss=0.2433
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=558/500000]
+ train/ActionNoiseL2Loss=0.3687
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=559/500000]
+ train/ActionNoiseL2Loss=0.3569
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=560/500000]
+ optim/total_grad_norm=11.08
+ train/ActionNoiseL2Loss=0.2149
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=561/500000]
+ train/ActionNoiseL2Loss=0.3996
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=562/500000]
+ train/ActionNoiseL2Loss=0.2385
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=563/500000]
+ train/ActionNoiseL2Loss=0.3098
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=564/500000]
+ train/ActionNoiseL2Loss=0.3337
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=565/500000]
+ train/ActionNoiseL2Loss=0.2999
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=566/500000]
+ train/ActionNoiseL2Loss=0.2024
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=567/500000]
+ train/ActionNoiseL2Loss=0.2304
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=568/500000]
+ train/ActionNoiseL2Loss=0.4856
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=569/500000]
+ train/ActionNoiseL2Loss=0.2016
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=570/500000]
+ train/ActionNoiseL2Loss=0.2579
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=571/500000]
+ train/ActionNoiseL2Loss=0.3084
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=572/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=573/500000]
+ train/ActionNoiseL2Loss=0.2350
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=574/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=575/500000]
+ train/ActionNoiseL2Loss=0.2580
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=576/500000]
+ train/ActionNoiseL2Loss=0.2625
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=577/500000]
+ train/ActionNoiseL2Loss=0.2244
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=578/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=579/500000]
+ train/ActionNoiseL2Loss=0.3054
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=580/500000]
+ optim/total_grad_norm=10.45
+ train/ActionNoiseL2Loss=0.3322
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=581/500000]
+ train/ActionNoiseL2Loss=0.4361
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=582/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=583/500000]
+ train/ActionNoiseL2Loss=0.2494
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=584/500000]
+ train/ActionNoiseL2Loss=0.3136
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=585/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=586/500000]
+ train/ActionNoiseL2Loss=0.2860
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=587/500000]
+ train/ActionNoiseL2Loss=0.2586
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=588/500000]
+ train/ActionNoiseL2Loss=0.3253
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=589/500000]
+ train/ActionNoiseL2Loss=0.3766
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=590/500000]
+ train/ActionNoiseL2Loss=0.3232
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=591/500000]
+ train/ActionNoiseL2Loss=0.2222
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=592/500000]
+ train/ActionNoiseL2Loss=0.2982
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=593/500000]
+ train/ActionNoiseL2Loss=0.3529
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=594/500000]
+ train/ActionNoiseL2Loss=0.3154
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=595/500000]
+ train/ActionNoiseL2Loss=0.3848
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=596/500000]
+ train/ActionNoiseL2Loss=0.2298
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=597/500000]
+ train/ActionNoiseL2Loss=0.3628
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=598/500000]
+ train/ActionNoiseL2Loss=0.2170
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=599/500000]
+ train/ActionNoiseL2Loss=0.3270
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=600/500000]
+ optim/total_grad_norm=7.714
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=601/500000]
+ train/ActionNoiseL2Loss=0.3832
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=602/500000]
+ train/ActionNoiseL2Loss=0.3520
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=603/500000]
+ train/ActionNoiseL2Loss=0.2291
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=604/500000]
+ train/ActionNoiseL2Loss=0.3090
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=605/500000]
+ train/ActionNoiseL2Loss=0.2839
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=606/500000]
+ train/ActionNoiseL2Loss=0.3118
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=607/500000]
+ train/ActionNoiseL2Loss=0.2505
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=608/500000]
+ train/ActionNoiseL2Loss=0.2150
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=609/500000]
+ train/ActionNoiseL2Loss=0.3094
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=610/500000]
+ train/ActionNoiseL2Loss=0.2740
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=611/500000]
+ train/ActionNoiseL2Loss=0.2692
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=612/500000]
+ train/ActionNoiseL2Loss=0.4599
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=613/500000]
+ train/ActionNoiseL2Loss=0.1965
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=614/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=615/500000]
+ train/ActionNoiseL2Loss=0.2792
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=616/500000]
+ train/ActionNoiseL2Loss=0.3497
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=617/500000]
+ train/ActionNoiseL2Loss=0.2428
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=618/500000]
+ train/ActionNoiseL2Loss=0.2402
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=619/500000]
+ train/ActionNoiseL2Loss=0.2984
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=620/500000]
+ optim/total_grad_norm=9.274
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=621/500000]
+ train/ActionNoiseL2Loss=0.3044
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=622/500000]
+ train/ActionNoiseL2Loss=0.3633
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=623/500000]
+ train/ActionNoiseL2Loss=0.2705
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=624/500000]
+ train/ActionNoiseL2Loss=0.3191
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=625/500000]
+ train/ActionNoiseL2Loss=0.2815
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=626/500000]
+ train/ActionNoiseL2Loss=0.2197
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=627/500000]
+ train/ActionNoiseL2Loss=0.2208
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=628/500000]
+ train/ActionNoiseL2Loss=0.4108
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=629/500000]
+ train/ActionNoiseL2Loss=0.3528
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=630/500000]
+ train/ActionNoiseL2Loss=0.3857
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=631/500000]
+ train/ActionNoiseL2Loss=0.2373
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=632/500000]
+ train/ActionNoiseL2Loss=0.4133
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=633/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=634/500000]
+ train/ActionNoiseL2Loss=0.2493
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=635/500000]
+ train/ActionNoiseL2Loss=0.2701
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=636/500000]
+ train/ActionNoiseL2Loss=0.3454
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=637/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=638/500000]
+ train/ActionNoiseL2Loss=0.3303
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=639/500000]
+ train/ActionNoiseL2Loss=0.2385
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=640/500000]
+ optim/total_grad_norm=9.676
+ train/ActionNoiseL2Loss=0.2355
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=641/500000]
+ train/ActionNoiseL2Loss=0.3504
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=642/500000]
+ train/ActionNoiseL2Loss=0.3036
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=643/500000]
+ train/ActionNoiseL2Loss=0.2885
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=644/500000]
+ train/ActionNoiseL2Loss=0.3331
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=645/500000]
+ train/ActionNoiseL2Loss=0.3556
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=646/500000]
+ train/ActionNoiseL2Loss=0.2610
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=647/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=648/500000]
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=649/500000]
+ train/ActionNoiseL2Loss=0.3038
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=650/500000]
+ train/ActionNoiseL2Loss=0.2818
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=651/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=652/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=653/500000]
+ train/ActionNoiseL2Loss=0.2200
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=654/500000]
+ train/ActionNoiseL2Loss=0.3249
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=655/500000]
+ train/ActionNoiseL2Loss=0.3284
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=656/500000]
+ train/ActionNoiseL2Loss=0.2500
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=657/500000]
+ train/ActionNoiseL2Loss=0.2120
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=658/500000]
+ train/ActionNoiseL2Loss=0.2766
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=659/500000]
+ train/ActionNoiseL2Loss=0.2316
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=660/500000]
+ optim/total_grad_norm=10.50
+ train/ActionNoiseL2Loss=0.3294
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=661/500000]
+ train/ActionNoiseL2Loss=0.3483
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=662/500000]
+ train/ActionNoiseL2Loss=0.3024
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=663/500000]
+ train/ActionNoiseL2Loss=0.3426
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=664/500000]
+ train/ActionNoiseL2Loss=0.4299
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=665/500000]
+ train/ActionNoiseL2Loss=0.3260
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=666/500000]
+ train/ActionNoiseL2Loss=0.2412
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=667/500000]
+ train/ActionNoiseL2Loss=0.3959
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=668/500000]
+ train/ActionNoiseL2Loss=0.2086
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=669/500000]
+ train/ActionNoiseL2Loss=0.2452
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=670/500000]
+ train/ActionNoiseL2Loss=0.3393
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=671/500000]
+ train/ActionNoiseL2Loss=0.2390
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=672/500000]
+ train/ActionNoiseL2Loss=0.2263
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=673/500000]
+ train/ActionNoiseL2Loss=0.2241
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=674/500000]
+ train/ActionNoiseL2Loss=0.2432
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=675/500000]
+ train/ActionNoiseL2Loss=0.3258
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=676/500000]
+ train/ActionNoiseL2Loss=0.2947
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=677/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=678/500000]
+ train/ActionNoiseL2Loss=0.2075
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=679/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=680/500000]
+ optim/total_grad_norm=9.835
+ train/ActionNoiseL2Loss=0.3826
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=681/500000]
+ train/ActionNoiseL2Loss=0.3250
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=682/500000]
+ train/ActionNoiseL2Loss=0.2524
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=683/500000]
+ train/ActionNoiseL2Loss=0.1977
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=684/500000]
+ train/ActionNoiseL2Loss=0.4478
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=685/500000]
+ train/ActionNoiseL2Loss=0.2329
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=686/500000]
+ train/ActionNoiseL2Loss=0.1844
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=687/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=688/500000]
+ train/ActionNoiseL2Loss=0.2650
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=689/500000]
+ train/ActionNoiseL2Loss=0.2342
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=690/500000]
+ train/ActionNoiseL2Loss=0.3479
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=691/500000]
+ train/ActionNoiseL2Loss=0.2174
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=692/500000]
+ train/ActionNoiseL2Loss=0.3429
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=693/500000]
+ train/ActionNoiseL2Loss=0.3544
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=694/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=695/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=696/500000]
+ train/ActionNoiseL2Loss=0.3923
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=697/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=698/500000]
+ train/ActionNoiseL2Loss=0.2231
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=699/500000]
+ train/ActionNoiseL2Loss=0.2689
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=700/500000]
+ optim/total_grad_norm=7.979
+ train/ActionNoiseL2Loss=0.2583
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=701/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=702/500000]
+ train/ActionNoiseL2Loss=0.3245
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=703/500000]
+ train/ActionNoiseL2Loss=0.2381
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=704/500000]
+ train/ActionNoiseL2Loss=0.2367
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=705/500000]
+ train/ActionNoiseL2Loss=0.2901
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=706/500000]
+ train/ActionNoiseL2Loss=0.2734
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=707/500000]
+ train/ActionNoiseL2Loss=0.2891
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=708/500000]
+ train/ActionNoiseL2Loss=0.2570
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=709/500000]
+ train/ActionNoiseL2Loss=0.3185
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=710/500000]
+ train/ActionNoiseL2Loss=0.3525
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=711/500000]
+ train/ActionNoiseL2Loss=0.2285
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=712/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=713/500000]
+ train/ActionNoiseL2Loss=0.2566
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=714/500000]
+ train/ActionNoiseL2Loss=0.2975
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=715/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=716/500000]
+ train/ActionNoiseL2Loss=0.2021
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=717/500000]
+ train/ActionNoiseL2Loss=0.2357
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=718/500000]
+ train/ActionNoiseL2Loss=0.3282
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=719/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=720/500000]
+ optim/total_grad_norm=5.416
+ train/ActionNoiseL2Loss=0.2435
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=721/500000]
+ train/ActionNoiseL2Loss=0.2458
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=722/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=723/500000]
+ train/ActionNoiseL2Loss=0.3508
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=724/500000]
+ train/ActionNoiseL2Loss=0.2340
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=725/500000]
+ train/ActionNoiseL2Loss=0.2058
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=726/500000]
+ train/ActionNoiseL2Loss=0.2282
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=727/500000]
+ train/ActionNoiseL2Loss=0.2481
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=728/500000]
+ train/ActionNoiseL2Loss=0.2685
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=729/500000]
+ train/ActionNoiseL2Loss=0.2129
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=730/500000]
+ train/ActionNoiseL2Loss=0.2271
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=731/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=732/500000]
+ train/ActionNoiseL2Loss=0.1941
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=733/500000]
+ train/ActionNoiseL2Loss=0.2422
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=734/500000]
+ train/ActionNoiseL2Loss=0.2305
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=735/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=736/500000]
+ train/ActionNoiseL2Loss=0.2155
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=737/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=738/500000]
+ train/ActionNoiseL2Loss=0.1900
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=739/500000]
+ train/ActionNoiseL2Loss=0.3233
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=740/500000]
+ optim/total_grad_norm=5.448
+ train/ActionNoiseL2Loss=0.2274
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=741/500000]
+ train/ActionNoiseL2Loss=0.3129
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=742/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=743/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=744/500000]
+ train/ActionNoiseL2Loss=0.2621
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=745/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=746/500000]
+ train/ActionNoiseL2Loss=0.2082
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=747/500000]
+ train/ActionNoiseL2Loss=0.2813
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=748/500000]
+ train/ActionNoiseL2Loss=0.2605
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=749/500000]
+ train/ActionNoiseL2Loss=0.2694
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=750/500000]
+ train/ActionNoiseL2Loss=0.2347
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=751/500000]
+ train/ActionNoiseL2Loss=0.2732
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=752/500000]
+ train/ActionNoiseL2Loss=0.3297
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=753/500000]
+ train/ActionNoiseL2Loss=0.2757
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=754/500000]
+ train/ActionNoiseL2Loss=0.2260
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=755/500000]
+ train/ActionNoiseL2Loss=0.2018
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=756/500000]
+ train/ActionNoiseL2Loss=0.2809
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=757/500000]
+ train/ActionNoiseL2Loss=0.2623
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=758/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=759/500000]
+ train/ActionNoiseL2Loss=0.2148
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=760/500000]
+ optim/total_grad_norm=8.802
+ train/ActionNoiseL2Loss=0.4036
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=761/500000]
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=762/500000]
+ train/ActionNoiseL2Loss=0.4094
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=763/500000]
+ train/ActionNoiseL2Loss=0.2702
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=764/500000]
+ train/ActionNoiseL2Loss=0.3034
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=765/500000]
+ train/ActionNoiseL2Loss=0.3291
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=766/500000]
+ train/ActionNoiseL2Loss=0.3111
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=767/500000]
+ train/ActionNoiseL2Loss=0.2223
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=768/500000]
+ train/ActionNoiseL2Loss=0.2767
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=769/500000]
+ train/ActionNoiseL2Loss=0.2417
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=770/500000]
+ train/ActionNoiseL2Loss=0.2623
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=771/500000]
+ train/ActionNoiseL2Loss=0.3102
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=772/500000]
+ train/ActionNoiseL2Loss=0.2556
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=773/500000]
+ train/ActionNoiseL2Loss=0.2493
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=774/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=775/500000]
+ train/ActionNoiseL2Loss=0.1953
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=776/500000]
+ train/ActionNoiseL2Loss=0.3365
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=777/500000]
+ train/ActionNoiseL2Loss=0.2602
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=778/500000]
+ train/ActionNoiseL2Loss=0.3164
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=779/500000]
+ train/ActionNoiseL2Loss=0.3995
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=780/500000]
+ optim/total_grad_norm=8.342
+ train/ActionNoiseL2Loss=0.3254
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=781/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=782/500000]
+ train/ActionNoiseL2Loss=0.2820
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=783/500000]
+ train/ActionNoiseL2Loss=0.2748
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=784/500000]
+ train/ActionNoiseL2Loss=0.3442
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=785/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=786/500000]
+ train/ActionNoiseL2Loss=0.1554
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=787/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=788/500000]
+ train/ActionNoiseL2Loss=0.2260
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=789/500000]
+ train/ActionNoiseL2Loss=0.2917
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=790/500000]
+ train/ActionNoiseL2Loss=0.2771
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=791/500000]
+ train/ActionNoiseL2Loss=0.3337
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=792/500000]
+ train/ActionNoiseL2Loss=0.2172
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=793/500000]
+ train/ActionNoiseL2Loss=0.1840
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=794/500000]
+ train/ActionNoiseL2Loss=0.2672
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=795/500000]
+ train/ActionNoiseL2Loss=0.2628
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=796/500000]
+ train/ActionNoiseL2Loss=0.2991
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=797/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=798/500000]
+ train/ActionNoiseL2Loss=0.2712
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=799/500000]
+ train/ActionNoiseL2Loss=0.3670
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=800/500000]
+ optim/total_grad_norm=6.561
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=801/500000]
+ train/ActionNoiseL2Loss=0.2413
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=802/500000]
+ train/ActionNoiseL2Loss=0.2205
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=803/500000]
+ train/ActionNoiseL2Loss=0.2232
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=804/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=805/500000]
+ train/ActionNoiseL2Loss=0.2016
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=806/500000]
+ train/ActionNoiseL2Loss=0.2500
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=807/500000]
+ train/ActionNoiseL2Loss=0.2691
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=808/500000]
+ train/ActionNoiseL2Loss=0.2126
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=809/500000]
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=810/500000]
+ train/ActionNoiseL2Loss=0.2066
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=811/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=812/500000]
+ train/ActionNoiseL2Loss=0.3527
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=813/500000]
+ train/ActionNoiseL2Loss=0.2357
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=814/500000]
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=815/500000]
+ train/ActionNoiseL2Loss=0.2330
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=816/500000]
+ train/ActionNoiseL2Loss=0.3079
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=817/500000]
+ train/ActionNoiseL2Loss=0.3100
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=818/500000]
+ train/ActionNoiseL2Loss=0.2881
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=819/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=820/500000]
+ optim/total_grad_norm=6.135
+ train/ActionNoiseL2Loss=0.2008
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=821/500000]
+ train/ActionNoiseL2Loss=0.3142
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=822/500000]
+ train/ActionNoiseL2Loss=0.2169
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=823/500000]
+ train/ActionNoiseL2Loss=0.2652
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=824/500000]
+ train/ActionNoiseL2Loss=0.2431
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=825/500000]
+ train/ActionNoiseL2Loss=0.2607
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=826/500000]
+ train/ActionNoiseL2Loss=0.2572
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=827/500000]
+ train/ActionNoiseL2Loss=0.3066
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=828/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=829/500000]
+ train/ActionNoiseL2Loss=0.2526
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=830/500000]
+ train/ActionNoiseL2Loss=0.2406
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=831/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=832/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=833/500000]
+ train/ActionNoiseL2Loss=0.2977
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=834/500000]
+ train/ActionNoiseL2Loss=0.3535
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=835/500000]
+ train/ActionNoiseL2Loss=0.2288
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=836/500000]
+ train/ActionNoiseL2Loss=0.1917
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=837/500000]
+ train/ActionNoiseL2Loss=0.2699
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=838/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=839/500000]
+ train/ActionNoiseL2Loss=0.2689
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=840/500000]
+ optim/total_grad_norm=5.276
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=841/500000]
+ train/ActionNoiseL2Loss=0.2995
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=842/500000]
+ train/ActionNoiseL2Loss=0.2184
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=843/500000]
+ train/ActionNoiseL2Loss=0.1912
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=844/500000]
+ train/ActionNoiseL2Loss=0.2803
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=845/500000]
+ train/ActionNoiseL2Loss=0.2208
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=846/500000]
+ train/ActionNoiseL2Loss=0.2631
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=847/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=848/500000]
+ train/ActionNoiseL2Loss=0.2181
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=849/500000]
+ train/ActionNoiseL2Loss=0.2849
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=850/500000]
+ train/ActionNoiseL2Loss=0.2013
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=851/500000]
+ train/ActionNoiseL2Loss=0.1997
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=852/500000]
+ train/ActionNoiseL2Loss=0.2657
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=853/500000]
+ train/ActionNoiseL2Loss=0.2046
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=854/500000]
+ train/ActionNoiseL2Loss=0.3247
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=855/500000]
+ train/ActionNoiseL2Loss=0.4385
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=856/500000]
+ train/ActionNoiseL2Loss=0.3348
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=857/500000]
+ train/ActionNoiseL2Loss=0.2319
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=858/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=859/500000]
+ train/ActionNoiseL2Loss=0.4121
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=860/500000]
+ optim/total_grad_norm=7.486
+ train/ActionNoiseL2Loss=0.2676
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=861/500000]
+ train/ActionNoiseL2Loss=0.3332
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=862/500000]
+ train/ActionNoiseL2Loss=0.2727
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=863/500000]
+ train/ActionNoiseL2Loss=0.3737
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=864/500000]
+ train/ActionNoiseL2Loss=0.3117
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=865/500000]
+ train/ActionNoiseL2Loss=0.3073
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=866/500000]
+ train/ActionNoiseL2Loss=0.4775
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=867/500000]
+ train/ActionNoiseL2Loss=0.3213
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=868/500000]
+ train/ActionNoiseL2Loss=0.3004
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=869/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=870/500000]
+ train/ActionNoiseL2Loss=0.2598
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=871/500000]
+ train/ActionNoiseL2Loss=0.1703
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=872/500000]
+ train/ActionNoiseL2Loss=0.3176
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=873/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=874/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=875/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=876/500000]
+ train/ActionNoiseL2Loss=0.2212
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=877/500000]
+ train/ActionNoiseL2Loss=0.2840
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=878/500000]
+ train/ActionNoiseL2Loss=0.2488
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=879/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=880/500000]
+ optim/total_grad_norm=6.435
+ train/ActionNoiseL2Loss=0.2493
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=881/500000]
+ train/ActionNoiseL2Loss=0.2532
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=882/500000]
+ train/ActionNoiseL2Loss=0.2676
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=883/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=884/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=885/500000]
+ train/ActionNoiseL2Loss=0.2225
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=886/500000]
+ train/ActionNoiseL2Loss=0.1920
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=887/500000]
+ train/ActionNoiseL2Loss=0.2282
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=888/500000]
+ train/ActionNoiseL2Loss=0.2982
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=889/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=890/500000]
+ train/ActionNoiseL2Loss=0.2326
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=891/500000]
+ train/ActionNoiseL2Loss=0.2536
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=892/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=893/500000]
+ train/ActionNoiseL2Loss=0.1659
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=894/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=895/500000]
+ train/ActionNoiseL2Loss=0.2293
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=896/500000]
+ train/ActionNoiseL2Loss=0.2192
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=897/500000]
+ train/ActionNoiseL2Loss=0.2645
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=898/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=899/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=900/500000]
+ optim/total_grad_norm=3.762
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=901/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=902/500000]
+ train/ActionNoiseL2Loss=0.2957
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=903/500000]
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=904/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=905/500000]
+ train/ActionNoiseL2Loss=0.1988
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=906/500000]
+ train/ActionNoiseL2Loss=0.2214
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=907/500000]
+ train/ActionNoiseL2Loss=0.1910
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=908/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=909/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=910/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=911/500000]
+ train/ActionNoiseL2Loss=0.1846
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=912/500000]
+ train/ActionNoiseL2Loss=0.1719
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=913/500000]
+ train/ActionNoiseL2Loss=0.2292
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=914/500000]
+ train/ActionNoiseL2Loss=0.2476
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=915/500000]
+ train/ActionNoiseL2Loss=0.2780
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=916/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=917/500000]
+ train/ActionNoiseL2Loss=0.2390
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=918/500000]
+ train/ActionNoiseL2Loss=0.1917
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=919/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=920/500000]
+ optim/total_grad_norm=5.115
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=921/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=922/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=923/500000]
+ train/ActionNoiseL2Loss=0.2438
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=924/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=925/500000]
+ train/ActionNoiseL2Loss=0.2029
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=926/500000]
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=927/500000]
+ train/ActionNoiseL2Loss=0.2547
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=928/500000]
+ train/ActionNoiseL2Loss=0.1982
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=929/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=930/500000]
+ train/ActionNoiseL2Loss=0.2425
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=931/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=932/500000]
+ train/ActionNoiseL2Loss=0.2306
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=933/500000]
+ train/ActionNoiseL2Loss=0.3116
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=934/500000]
+ train/ActionNoiseL2Loss=0.2747
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=935/500000]
+ train/ActionNoiseL2Loss=0.2493
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=936/500000]
+ train/ActionNoiseL2Loss=0.2775
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=937/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=938/500000]
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=939/500000]
+ train/ActionNoiseL2Loss=0.2047
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=940/500000]
+ optim/total_grad_norm=6.075
+ train/ActionNoiseL2Loss=0.2232
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=941/500000]
+ train/ActionNoiseL2Loss=0.2602
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=942/500000]
+ train/ActionNoiseL2Loss=0.4131
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=943/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=944/500000]
+ train/ActionNoiseL2Loss=0.2187
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=945/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=946/500000]
+ train/ActionNoiseL2Loss=0.2365
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=947/500000]
+ train/ActionNoiseL2Loss=0.2422
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=948/500000]
+ train/ActionNoiseL2Loss=0.2525
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=949/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=950/500000]
+ train/ActionNoiseL2Loss=0.2462
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=951/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=952/500000]
+ train/ActionNoiseL2Loss=0.1661
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=953/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=954/500000]
+ train/ActionNoiseL2Loss=0.2341
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=955/500000]
+ train/ActionNoiseL2Loss=0.1702
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=956/500000]
+ train/ActionNoiseL2Loss=0.3213
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=957/500000]
+ train/ActionNoiseL2Loss=0.2586
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=958/500000]
+ train/ActionNoiseL2Loss=0.3470
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=959/500000]
+ train/ActionNoiseL2Loss=0.1824
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=960/500000]
+ optim/total_grad_norm=5.976
+ train/ActionNoiseL2Loss=0.2164
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=961/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=962/500000]
+ train/ActionNoiseL2Loss=0.2039
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=963/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=964/500000]
+ train/ActionNoiseL2Loss=0.2737
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=965/500000]
+ train/ActionNoiseL2Loss=0.2138
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=966/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=967/500000]
+ train/ActionNoiseL2Loss=0.3223
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=968/500000]
+ train/ActionNoiseL2Loss=0.2433
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=969/500000]
+ train/ActionNoiseL2Loss=0.2538
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=970/500000]
+ train/ActionNoiseL2Loss=0.3534
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=971/500000]
+ train/ActionNoiseL2Loss=0.2235
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=972/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=973/500000]
+ train/ActionNoiseL2Loss=0.2220
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=974/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=975/500000]
+ train/ActionNoiseL2Loss=0.2659
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=976/500000]
+ train/ActionNoiseL2Loss=0.2287
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=977/500000]
+ train/ActionNoiseL2Loss=0.2063
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=978/500000]
+ train/ActionNoiseL2Loss=0.2648
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=979/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=980/500000]
+ optim/total_grad_norm=6.305
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=981/500000]
+ train/ActionNoiseL2Loss=0.2864
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=982/500000]
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=983/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=984/500000]
+ train/ActionNoiseL2Loss=0.2069
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=985/500000]
+ train/ActionNoiseL2Loss=0.1750
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=986/500000]
+ train/ActionNoiseL2Loss=0.2155
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=987/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=988/500000]
+ train/ActionNoiseL2Loss=0.2053
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=989/500000]
+ train/ActionNoiseL2Loss=0.3031
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=990/500000]
+ train/ActionNoiseL2Loss=0.1851
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=991/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=992/500000]
+ train/ActionNoiseL2Loss=0.1919
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=993/500000]
+ train/ActionNoiseL2Loss=0.2373
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=994/500000]
+ train/ActionNoiseL2Loss=0.3134
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=995/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=996/500000]
+ train/ActionNoiseL2Loss=0.3231
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=997/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=998/500000]
+ train/ActionNoiseL2Loss=0.2309
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=999/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1000/500000]
+ optim/total_grad_norm=7.855
+ train/ActionNoiseL2Loss=0.2846
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+09/28 [16:53:49] INFO | >> Saving config... checkpoint.py:608
+09/28 [16:54:20] INFO | >> Saving model state... checkpoint.py:796
+09/28 [16:55:23] INFO | >> Saving optim state... checkpoint.py:811
+09/28 [16:55:28] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionNoiseL2Loss=0.3146
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1002/500000]
+ train/ActionNoiseL2Loss=0.2411
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=1003/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=1004/500000]
+ train/ActionNoiseL2Loss=0.2147
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=1005/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=1006/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=1007/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=1008/500000]
+ train/ActionNoiseL2Loss=0.2299
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=1009/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1010/500000]
+ train/ActionNoiseL2Loss=0.2191
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1011/500000]
+ train/ActionNoiseL2Loss=0.2277
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1012/500000]
+ train/ActionNoiseL2Loss=0.3264
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1013/500000]
+ train/ActionNoiseL2Loss=0.2256
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1014/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1015/500000]
+ train/ActionNoiseL2Loss=0.2290
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1016/500000]
+ train/ActionNoiseL2Loss=0.2688
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1017/500000]
+ train/ActionNoiseL2Loss=0.3234
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1018/500000]
+ train/ActionNoiseL2Loss=0.2174
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1019/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1020/500000]
+ optim/total_grad_norm=4.049
+ train/ActionNoiseL2Loss=0.2277
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1021/500000]
+ train/ActionNoiseL2Loss=0.2519
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1022/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1023/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1024/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1025/500000]
+ train/ActionNoiseL2Loss=0.2047
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1026/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1027/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1028/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1029/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1030/500000]
+ train/ActionNoiseL2Loss=0.1862
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1031/500000]
+ train/ActionNoiseL2Loss=0.2742
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1032/500000]
+ train/ActionNoiseL2Loss=0.2197
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1033/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1034/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1035/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1036/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1037/500000]
+ train/ActionNoiseL2Loss=0.2119
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1038/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1039/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1040/500000]
+ optim/total_grad_norm=5.037
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1041/500000]
+ train/ActionNoiseL2Loss=0.2842
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1042/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1043/500000]
+ train/ActionNoiseL2Loss=0.2276
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1044/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1045/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1046/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1047/500000]
+ train/ActionNoiseL2Loss=0.3086
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1048/500000]
+ train/ActionNoiseL2Loss=0.2224
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1049/500000]
+ train/ActionNoiseL2Loss=0.1992
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1050/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1051/500000]
+ train/ActionNoiseL2Loss=0.1444
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1052/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1053/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1054/500000]
+ train/ActionNoiseL2Loss=0.1996
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1055/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1056/500000]
+ train/ActionNoiseL2Loss=0.3086
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1057/500000]
+ train/ActionNoiseL2Loss=0.1554
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1058/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1059/500000]
+ train/ActionNoiseL2Loss=0.2738
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1060/500000]
+ optim/total_grad_norm=4.957
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1061/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1062/500000]
+ train/ActionNoiseL2Loss=0.3110
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1063/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1064/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1065/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1066/500000]
+ train/ActionNoiseL2Loss=0.1901
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1067/500000]
+ train/ActionNoiseL2Loss=0.3061
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1068/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1069/500000]
+ train/ActionNoiseL2Loss=0.3356
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1070/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1071/500000]
+ train/ActionNoiseL2Loss=0.2381
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1072/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1073/500000]
+ train/ActionNoiseL2Loss=0.1738
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1074/500000]
+ train/ActionNoiseL2Loss=0.1942
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1075/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1076/500000]
+ train/ActionNoiseL2Loss=0.2529
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1077/500000]
+ train/ActionNoiseL2Loss=0.2178
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1078/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1079/500000]
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1080/500000]
+ optim/total_grad_norm=7.586
+ train/ActionNoiseL2Loss=0.2618
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1081/500000]
+ train/ActionNoiseL2Loss=0.2728
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1082/500000]
+ train/ActionNoiseL2Loss=0.2400
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1083/500000]
+ train/ActionNoiseL2Loss=0.2759
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1084/500000]
+ train/ActionNoiseL2Loss=0.2631
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1085/500000]
+ train/ActionNoiseL2Loss=0.2070
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1086/500000]
+ train/ActionNoiseL2Loss=0.2872
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1087/500000]
+ train/ActionNoiseL2Loss=0.2242
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1088/500000]
+ train/ActionNoiseL2Loss=0.2466
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1089/500000]
+ train/ActionNoiseL2Loss=0.2594
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1090/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1091/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1092/500000]
+ train/ActionNoiseL2Loss=0.2142
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1093/500000]
+ train/ActionNoiseL2Loss=0.2825
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1094/500000]
+ train/ActionNoiseL2Loss=0.3095
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1095/500000]
+ train/ActionNoiseL2Loss=0.2800
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1096/500000]
+ train/ActionNoiseL2Loss=0.2165
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1097/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1098/500000]
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1099/500000]
+ train/ActionNoiseL2Loss=0.1761
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1100/500000]
+ optim/total_grad_norm=3.741
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1101/500000]
+ train/ActionNoiseL2Loss=0.2935
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1102/500000]
+ train/ActionNoiseL2Loss=0.1727
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1103/500000]
+ train/ActionNoiseL2Loss=0.2536
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1104/500000]
+ train/ActionNoiseL2Loss=0.1841
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1105/500000]
+ train/ActionNoiseL2Loss=0.2159
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1106/500000]
+ train/ActionNoiseL2Loss=0.4070
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1107/500000]
+ train/ActionNoiseL2Loss=0.1971
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1108/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1109/500000]
+ train/ActionNoiseL2Loss=0.1905
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1110/500000]
+ train/ActionNoiseL2Loss=0.2187
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1111/500000]
+ train/ActionNoiseL2Loss=0.2096
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1112/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1113/500000]
+ train/ActionNoiseL2Loss=0.2591
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1114/500000]
+ train/ActionNoiseL2Loss=0.2501
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1115/500000]
+ train/ActionNoiseL2Loss=0.3157
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1116/500000]
+ train/ActionNoiseL2Loss=0.3335
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1117/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1118/500000]
+ train/ActionNoiseL2Loss=0.2959
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1119/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1120/500000]
+ optim/total_grad_norm=6.131
+ train/ActionNoiseL2Loss=0.2081
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1121/500000]
+ train/ActionNoiseL2Loss=0.2288
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1122/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1123/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1124/500000]
+ train/ActionNoiseL2Loss=0.3337
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1125/500000]
+ train/ActionNoiseL2Loss=0.2020
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1126/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1127/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1128/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1129/500000]
+ train/ActionNoiseL2Loss=0.2246
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1130/500000]
+ train/ActionNoiseL2Loss=0.2262
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1131/500000]
+ train/ActionNoiseL2Loss=0.2351
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1132/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1133/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1134/500000]
+ train/ActionNoiseL2Loss=0.2343
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1135/500000]
+ train/ActionNoiseL2Loss=0.2117
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1136/500000]
+ train/ActionNoiseL2Loss=0.1984
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1137/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1138/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1139/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1140/500000]
+ optim/total_grad_norm=6.509
+ train/ActionNoiseL2Loss=0.3528
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1141/500000]
+ train/ActionNoiseL2Loss=0.3565
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1142/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1143/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1144/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1145/500000]
+ train/ActionNoiseL2Loss=0.2957
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1146/500000]
+ train/ActionNoiseL2Loss=0.3450
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1147/500000]
+ train/ActionNoiseL2Loss=0.2904
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1148/500000]
+ train/ActionNoiseL2Loss=0.2355
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1149/500000]
+ train/ActionNoiseL2Loss=0.2786
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1150/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1151/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1152/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1153/500000]
+ train/ActionNoiseL2Loss=0.2182
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1154/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1155/500000]
+ train/ActionNoiseL2Loss=0.2605
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1156/500000]
+ train/ActionNoiseL2Loss=0.3521
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1157/500000]
+ train/ActionNoiseL2Loss=0.2900
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1158/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1159/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1160/500000]
+ optim/total_grad_norm=3.778
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1161/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1162/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1163/500000]
+ train/ActionNoiseL2Loss=0.2397
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1164/500000]
+ train/ActionNoiseL2Loss=0.1601
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1165/500000]
+ train/ActionNoiseL2Loss=0.2173
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1166/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1167/500000]
+ train/ActionNoiseL2Loss=0.2521
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1168/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1169/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1170/500000]
+ train/ActionNoiseL2Loss=0.1996
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1171/500000]
+ train/ActionNoiseL2Loss=0.4186
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1172/500000]
+ train/ActionNoiseL2Loss=0.1803
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1173/500000]
+ train/ActionNoiseL2Loss=0.1931
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1174/500000]
+ train/ActionNoiseL2Loss=0.2982
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1175/500000]
+ train/ActionNoiseL2Loss=0.1833
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1176/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1177/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1178/500000]
+ train/ActionNoiseL2Loss=0.1945
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1179/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1180/500000]
+ optim/total_grad_norm=5.480
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1181/500000]
+ train/ActionNoiseL2Loss=0.2563
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1182/500000]
+ train/ActionNoiseL2Loss=0.1751
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1183/500000]
+ train/ActionNoiseL2Loss=0.2117
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1184/500000]
+ train/ActionNoiseL2Loss=0.1767
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1185/500000]
+ train/ActionNoiseL2Loss=0.1592
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1186/500000]
+ train/ActionNoiseL2Loss=0.3060
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1187/500000]
+ train/ActionNoiseL2Loss=0.2436
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1188/500000]
+ train/ActionNoiseL2Loss=0.2560
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1189/500000]
+ train/ActionNoiseL2Loss=0.3174
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1190/500000]
+ train/ActionNoiseL2Loss=0.1865
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1191/500000]
+ train/ActionNoiseL2Loss=0.2133
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1192/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1193/500000]
+ train/ActionNoiseL2Loss=0.1951
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1194/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1195/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1196/500000]
+ train/ActionNoiseL2Loss=0.2008
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1197/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1198/500000]
+ train/ActionNoiseL2Loss=0.2116
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1199/500000]
+ train/ActionNoiseL2Loss=0.2066
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1200/500000]
+ optim/total_grad_norm=5.451
+ train/ActionNoiseL2Loss=0.2145
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1201/500000]
+ train/ActionNoiseL2Loss=0.2038
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1202/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1203/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1204/500000]
+ train/ActionNoiseL2Loss=0.2623
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1205/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1206/500000]
+ train/ActionNoiseL2Loss=0.3001
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1207/500000]
+ train/ActionNoiseL2Loss=0.1895
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1208/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1209/500000]
+ train/ActionNoiseL2Loss=0.1759
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1210/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1211/500000]
+ train/ActionNoiseL2Loss=0.2875
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1212/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1213/500000]
+ train/ActionNoiseL2Loss=0.3281
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1214/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1215/500000]
+ train/ActionNoiseL2Loss=0.3042
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1216/500000]
+ train/ActionNoiseL2Loss=0.3239
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1217/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1218/500000]
+ train/ActionNoiseL2Loss=0.2162
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1219/500000]
+ train/ActionNoiseL2Loss=0.1846
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1220/500000]
+ optim/total_grad_norm=3.463
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1221/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1222/500000]
+ train/ActionNoiseL2Loss=0.3310
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1223/500000]
+ train/ActionNoiseL2Loss=0.2363
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1224/500000]
+ train/ActionNoiseL2Loss=0.1758
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1225/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1226/500000]
+ train/ActionNoiseL2Loss=0.1741
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1227/500000]
+ train/ActionNoiseL2Loss=0.2176
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1228/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1229/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1230/500000]
+ train/ActionNoiseL2Loss=0.1863
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1231/500000]
+ train/ActionNoiseL2Loss=0.2587
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1232/500000]
+ train/ActionNoiseL2Loss=0.2558
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1233/500000]
+ train/ActionNoiseL2Loss=0.2338
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1234/500000]
+ train/ActionNoiseL2Loss=0.3546
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1235/500000]
+ train/ActionNoiseL2Loss=0.2262
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1236/500000]
+ train/ActionNoiseL2Loss=0.2129
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1237/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1238/500000]
+ train/ActionNoiseL2Loss=0.1845
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1239/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1240/500000]
+ optim/total_grad_norm=4.124
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1241/500000]
+ train/ActionNoiseL2Loss=0.1997
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1242/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1243/500000]
+ train/ActionNoiseL2Loss=0.2273
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1244/500000]
+ train/ActionNoiseL2Loss=0.2215
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1245/500000]
+ train/ActionNoiseL2Loss=0.2012
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1246/500000]
+ train/ActionNoiseL2Loss=0.2158
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1247/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1248/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1249/500000]
+ train/ActionNoiseL2Loss=0.1622
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1250/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1251/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1252/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1253/500000]
+ train/ActionNoiseL2Loss=0.1959
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1254/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1255/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1256/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1257/500000]
+ train/ActionNoiseL2Loss=0.1896
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1258/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1259/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1260/500000]
+ optim/total_grad_norm=4.171
+ train/ActionNoiseL2Loss=0.1839
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1261/500000]
+ train/ActionNoiseL2Loss=0.1885
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1262/500000]
+ train/ActionNoiseL2Loss=0.2798
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1263/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1264/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1265/500000]
+ train/ActionNoiseL2Loss=0.1833
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1266/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1267/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1268/500000]
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1269/500000]
+ train/ActionNoiseL2Loss=0.2123
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1270/500000]
+ train/ActionNoiseL2Loss=0.2244
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1271/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1272/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1273/500000]
+ train/ActionNoiseL2Loss=0.1928
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1274/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1275/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1276/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1277/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1278/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1279/500000]
+ train/ActionNoiseL2Loss=0.2038
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1280/500000]
+ optim/total_grad_norm=4.075
+ train/ActionNoiseL2Loss=0.1814
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1281/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1282/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1283/500000]
+ train/ActionNoiseL2Loss=0.2076
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1284/500000]
+ train/ActionNoiseL2Loss=0.2120
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1285/500000]
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1286/500000]
+ train/ActionNoiseL2Loss=0.2324
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1287/500000]
+ train/ActionNoiseL2Loss=0.1868
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1288/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1289/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1290/500000]
+ train/ActionNoiseL2Loss=0.2166
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1291/500000]
+ train/ActionNoiseL2Loss=0.2887
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1292/500000]
+ train/ActionNoiseL2Loss=0.1619
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1293/500000]
+ train/ActionNoiseL2Loss=0.2765
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1294/500000]
+ train/ActionNoiseL2Loss=0.2177
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1295/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1296/500000]
+ train/ActionNoiseL2Loss=0.2996
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1297/500000]
+ train/ActionNoiseL2Loss=0.1902
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1298/500000]
+ train/ActionNoiseL2Loss=0.2646
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1299/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=1300/500000]
+ optim/total_grad_norm=2.550
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1301/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1302/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1303/500000]
+ train/ActionNoiseL2Loss=0.1889
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1304/500000]
+ train/ActionNoiseL2Loss=0.1727
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1305/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1306/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1307/500000]
+ train/ActionNoiseL2Loss=0.2474
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1308/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1309/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1310/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1311/500000]
+ train/ActionNoiseL2Loss=0.1954
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1312/500000]
+ train/ActionNoiseL2Loss=0.2332
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1313/500000]
+ train/ActionNoiseL2Loss=0.2017
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1314/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1315/500000]
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1316/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1317/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1318/500000]
+ train/ActionNoiseL2Loss=0.2422
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1319/500000]
+ train/ActionNoiseL2Loss=0.2305
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1320/500000]
+ optim/total_grad_norm=4.744
+ train/ActionNoiseL2Loss=0.2191
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1321/500000]
+ train/ActionNoiseL2Loss=0.2757
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1322/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1323/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1324/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1325/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1326/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1327/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1328/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1329/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1330/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1331/500000]
+ train/ActionNoiseL2Loss=0.2855
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1332/500000]
+ train/ActionNoiseL2Loss=0.2559
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1333/500000]
+ train/ActionNoiseL2Loss=0.2104
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1334/500000]
+ train/ActionNoiseL2Loss=0.2045
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1335/500000]
+ train/ActionNoiseL2Loss=0.2437
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1336/500000]
+ train/ActionNoiseL2Loss=0.2168
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1337/500000]
+ train/ActionNoiseL2Loss=0.1918
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1338/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1339/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1340/500000]
+ optim/total_grad_norm=4.442
+ train/ActionNoiseL2Loss=0.1853
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1341/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1342/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1343/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1344/500000]
+ train/ActionNoiseL2Loss=0.2657
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1345/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1346/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1347/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1348/500000]
+ train/ActionNoiseL2Loss=0.3902
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1349/500000]
+ train/ActionNoiseL2Loss=0.1923
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1350/500000]
+ train/ActionNoiseL2Loss=0.2193
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1351/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1352/500000]
+ train/ActionNoiseL2Loss=0.2109
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1353/500000]
+ train/ActionNoiseL2Loss=0.1768
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1354/500000]
+ train/ActionNoiseL2Loss=0.3030
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1355/500000]
+ train/ActionNoiseL2Loss=0.2055
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1356/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1357/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1358/500000]
+ train/ActionNoiseL2Loss=0.2404
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1359/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1360/500000]
+ optim/total_grad_norm=5.405
+ train/ActionNoiseL2Loss=0.2100
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1361/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1362/500000]
+ train/ActionNoiseL2Loss=0.2885
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1363/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1364/500000]
+ train/ActionNoiseL2Loss=0.2485
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1365/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1366/500000]
+ train/ActionNoiseL2Loss=0.2616
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1367/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1368/500000]
+ train/ActionNoiseL2Loss=0.1759
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1369/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1370/500000]
+ train/ActionNoiseL2Loss=0.3467
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1371/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1372/500000]
+ train/ActionNoiseL2Loss=0.3095
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1373/500000]
+ train/ActionNoiseL2Loss=0.2491
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1374/500000]
+ train/ActionNoiseL2Loss=0.2555
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1375/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1376/500000]
+ train/ActionNoiseL2Loss=0.1800
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1377/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1378/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1379/500000]
+ train/ActionNoiseL2Loss=0.2069
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1380/500000]
+ optim/total_grad_norm=3.581
+ train/ActionNoiseL2Loss=0.1755
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1381/500000]
+ train/ActionNoiseL2Loss=0.2257
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1382/500000]
+ train/ActionNoiseL2Loss=0.4064
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1383/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1384/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1385/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1386/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1387/500000]
+ train/ActionNoiseL2Loss=0.2402
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1388/500000]
+ train/ActionNoiseL2Loss=0.2429
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1389/500000]
+ train/ActionNoiseL2Loss=0.2621
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1390/500000]
+ train/ActionNoiseL2Loss=0.1907
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1391/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1392/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1393/500000]
+ train/ActionNoiseL2Loss=0.2054
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1394/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1395/500000]
+ train/ActionNoiseL2Loss=0.1726
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1396/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1397/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1398/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1399/500000]
+ train/ActionNoiseL2Loss=0.3406
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1400/500000]
+ optim/total_grad_norm=5.190
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1401/500000]
+ train/ActionNoiseL2Loss=0.2204
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1402/500000]
+ train/ActionNoiseL2Loss=0.2480
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1403/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1404/500000]
+ train/ActionNoiseL2Loss=0.2063
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1405/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1406/500000]
+ train/ActionNoiseL2Loss=0.2333
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1407/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1408/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1409/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1410/500000]
+ train/ActionNoiseL2Loss=0.3005
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1411/500000]
+ train/ActionNoiseL2Loss=0.2909
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1412/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1413/500000]
+ train/ActionNoiseL2Loss=0.2878
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1414/500000]
+ train/ActionNoiseL2Loss=0.1989
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1415/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1416/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1417/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1418/500000]
+ train/ActionNoiseL2Loss=0.2543
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1419/500000]
+ train/ActionNoiseL2Loss=0.2494
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1420/500000]
+ optim/total_grad_norm=4.090
+ train/ActionNoiseL2Loss=0.1647
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1421/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1422/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1423/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1424/500000]
+ train/ActionNoiseL2Loss=0.2826
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1425/500000]
+ train/ActionNoiseL2Loss=0.2260
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1426/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1427/500000]
+ train/ActionNoiseL2Loss=0.2272
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1428/500000]
+ train/ActionNoiseL2Loss=0.1806
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1429/500000]
+ train/ActionNoiseL2Loss=0.2454
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1430/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1431/500000]
+ train/ActionNoiseL2Loss=0.1947
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1432/500000]
+ train/ActionNoiseL2Loss=0.2589
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1433/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1434/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1435/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1436/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1437/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1438/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1439/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1440/500000]
+ optim/total_grad_norm=3.679
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1441/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1442/500000]
+ train/ActionNoiseL2Loss=0.2509
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1443/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1444/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=1445/500000]
+ train/ActionNoiseL2Loss=0.1836
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=1446/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=1447/500000]
+ train/ActionNoiseL2Loss=0.2199
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1448/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1449/500000]
+ train/ActionNoiseL2Loss=0.2248
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1450/500000]
+ train/ActionNoiseL2Loss=0.2002
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1451/500000]
+ train/ActionNoiseL2Loss=0.2821
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1452/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1453/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1454/500000]
+ train/ActionNoiseL2Loss=0.3101
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=1455/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=1456/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1457/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1458/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1459/500000]
+ train/ActionNoiseL2Loss=0.1785
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1460/500000]
+ optim/total_grad_norm=6.503
+ train/ActionNoiseL2Loss=0.2576
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1461/500000]
+ train/ActionNoiseL2Loss=0.3575
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1462/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1463/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1464/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1465/500000]
+ train/ActionNoiseL2Loss=0.1702
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1466/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1467/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1468/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1469/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1470/500000]
+ train/ActionNoiseL2Loss=0.2019
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1471/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1472/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1473/500000]
+ train/ActionNoiseL2Loss=0.2436
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1474/500000]
+ train/ActionNoiseL2Loss=0.2438
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1475/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1476/500000]
+ train/ActionNoiseL2Loss=0.2539
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1477/500000]
+ train/ActionNoiseL2Loss=0.2320
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1478/500000]
+ train/ActionNoiseL2Loss=0.2143
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1479/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1480/500000]
+ optim/total_grad_norm=4.337
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=1481/500000]
+ train/ActionNoiseL2Loss=0.2207
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1482/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1483/500000]
+ train/ActionNoiseL2Loss=0.2631
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1484/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1485/500000]
+ train/ActionNoiseL2Loss=0.2225
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1486/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1487/500000]
+ train/ActionNoiseL2Loss=0.2299
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1488/500000]
+ train/ActionNoiseL2Loss=0.2506
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1489/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1490/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=1491/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1492/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1493/500000]
+ train/ActionNoiseL2Loss=0.2348
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1494/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1495/500000]
+ train/ActionNoiseL2Loss=0.1614
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1496/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1497/500000]
+ train/ActionNoiseL2Loss=0.2721
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1498/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1499/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1500/500000]
+ optim/total_grad_norm=3.676
+ train/ActionNoiseL2Loss=0.1992
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+09/28 [19:56:21] INFO | >> Saving config... checkpoint.py:608
+09/28 [19:56:50] INFO | >> Saving model state... checkpoint.py:796
+09/28 [19:57:53] INFO | >> Saving optim state... checkpoint.py:811
+09/28 [19:57:58] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1502/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1503/500000]
+ train/ActionNoiseL2Loss=0.3055
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,078
+ throughput/device/batches_per_second=0.0449
+[step=1504/500000]
+ train/ActionNoiseL2Loss=0.2863
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,079
+ throughput/device/batches_per_second=0.0450
+[step=1505/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,086
+ throughput/device/batches_per_second=0.0453
+[step=1506/500000]
+ train/ActionNoiseL2Loss=0.2711
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,090
+ throughput/device/batches_per_second=0.0455
+[step=1507/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,095
+ throughput/device/batches_per_second=0.0456
+[step=1508/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,097
+ throughput/device/batches_per_second=0.0457
+[step=1509/500000]
+ train/ActionNoiseL2Loss=0.2158
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,099
+ throughput/device/batches_per_second=0.0458
+[step=1510/500000]
+ train/ActionNoiseL2Loss=0.2309
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+ System/Peak GPU Memory (MB)=44,539
+[step=1511/500000]
+ train/ActionNoiseL2Loss=0.1879
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,102
+ throughput/device/batches_per_second=0.0459
+[step=1512/500000]
+ train/ActionNoiseL2Loss=0.1918
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=1513/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1514/500000]
+ train/ActionNoiseL2Loss=0.2126
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1515/500000]
+ train/ActionNoiseL2Loss=0.2206
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=1516/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=1517/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=1518/500000]
+ train/ActionNoiseL2Loss=0.2313
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=1519/500000]
+ train/ActionNoiseL2Loss=0.1733
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=1520/500000]
+ optim/total_grad_norm=2.852
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,539
+[step=1521/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=1522/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1523/500000]
+ train/ActionNoiseL2Loss=0.2144
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1524/500000]
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1525/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1526/500000]
+ train/ActionNoiseL2Loss=0.2907
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1527/500000]
+ train/ActionNoiseL2Loss=0.1918
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1528/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1529/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1530/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1531/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1532/500000]
+ train/ActionNoiseL2Loss=0.2903
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1533/500000]
+ train/ActionNoiseL2Loss=0.2395
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1534/500000]
+ train/ActionNoiseL2Loss=0.2709
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1535/500000]
+ train/ActionNoiseL2Loss=0.2023
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1536/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1537/500000]
+ train/ActionNoiseL2Loss=0.1696
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1538/500000]
+ train/ActionNoiseL2Loss=0.2910
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1539/500000]
+ train/ActionNoiseL2Loss=0.1926
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1540/500000]
+ optim/total_grad_norm=3.541
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1541/500000]
+ train/ActionNoiseL2Loss=0.1764
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1542/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1543/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1544/500000]
+ train/ActionNoiseL2Loss=0.2119
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1545/500000]
+ train/ActionNoiseL2Loss=0.2144
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1546/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1547/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1548/500000]
+ train/ActionNoiseL2Loss=0.1651
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1549/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1550/500000]
+ train/ActionNoiseL2Loss=0.1785
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1551/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1552/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1553/500000]
+ train/ActionNoiseL2Loss=0.1913
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1554/500000]
+ train/ActionNoiseL2Loss=0.2437
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1555/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1556/500000]
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1557/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1558/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1559/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1560/500000]
+ optim/total_grad_norm=2.519
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1561/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1562/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1563/500000]
+ train/ActionNoiseL2Loss=0.1756
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1564/500000]
+ train/ActionNoiseL2Loss=0.2003
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1565/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1566/500000]
+ train/ActionNoiseL2Loss=0.2918
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1567/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1568/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1569/500000]
+ train/ActionNoiseL2Loss=0.2436
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1570/500000]
+ train/ActionNoiseL2Loss=0.2204
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1571/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1572/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1573/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1574/500000]
+ train/ActionNoiseL2Loss=0.1869
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1575/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1576/500000]
+ train/ActionNoiseL2Loss=0.2453
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1577/500000]
+ train/ActionNoiseL2Loss=0.2426
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1578/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1579/500000]
+ train/ActionNoiseL2Loss=0.2507
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1580/500000]
+ optim/total_grad_norm=2.807
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1581/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1582/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1583/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1584/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1585/500000]
+ train/ActionNoiseL2Loss=0.2192
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1586/500000]
+ train/ActionNoiseL2Loss=0.1946
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1587/500000]
+ train/ActionNoiseL2Loss=0.2010
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1588/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1589/500000]
+ train/ActionNoiseL2Loss=0.2072
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1590/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1591/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1592/500000]
+ train/ActionNoiseL2Loss=0.1809
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1593/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1594/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1595/500000]
+ train/ActionNoiseL2Loss=0.2421
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1596/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1597/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1598/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1599/500000]
+ train/ActionNoiseL2Loss=0.2657
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1600/500000]
+ optim/total_grad_norm=5.643
+ train/ActionNoiseL2Loss=0.2319
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1601/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1602/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1603/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1604/500000]
+ train/ActionNoiseL2Loss=0.2241
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1605/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1606/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1607/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1608/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1609/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1610/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1611/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1612/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1613/500000]
+ train/ActionNoiseL2Loss=0.2615
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1614/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1615/500000]
+ train/ActionNoiseL2Loss=0.1786
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1616/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1617/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1618/500000]
+ train/ActionNoiseL2Loss=0.2160
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1619/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1620/500000]
+ optim/total_grad_norm=2.422
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1621/500000]
+ train/ActionNoiseL2Loss=0.1962
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1622/500000]
+ train/ActionNoiseL2Loss=0.1900
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1623/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1624/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1625/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1626/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1627/500000]
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1628/500000]
+ train/ActionNoiseL2Loss=0.2804
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1629/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1630/500000]
+ train/ActionNoiseL2Loss=0.1613
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1631/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1632/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1633/500000]
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1634/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1635/500000]
+ train/ActionNoiseL2Loss=0.2598
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1636/500000]
+ train/ActionNoiseL2Loss=0.2793
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1637/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1638/500000]
+ train/ActionNoiseL2Loss=0.2844
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1639/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1640/500000]
+ optim/total_grad_norm=3.949
+ train/ActionNoiseL2Loss=0.1865
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1641/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1642/500000]
+ train/ActionNoiseL2Loss=0.2750
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1643/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1644/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1645/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1646/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1647/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1648/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1649/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1650/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1651/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1652/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1653/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1654/500000]
+ train/ActionNoiseL2Loss=0.2301
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1655/500000]
+ train/ActionNoiseL2Loss=0.2245
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1656/500000]
+ train/ActionNoiseL2Loss=0.2522
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1657/500000]
+ train/ActionNoiseL2Loss=0.2127
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1658/500000]
+ train/ActionNoiseL2Loss=0.2242
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1659/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1660/500000]
+ optim/total_grad_norm=3.008
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1661/500000]
+ train/ActionNoiseL2Loss=0.2756
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1662/500000]
+ train/ActionNoiseL2Loss=0.2328
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1663/500000]
+ train/ActionNoiseL2Loss=0.2554
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1664/500000]
+ train/ActionNoiseL2Loss=0.2547
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1665/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1666/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1667/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1668/500000]
+ train/ActionNoiseL2Loss=0.2597
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1669/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1670/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1671/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1672/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1673/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1674/500000]
+ train/ActionNoiseL2Loss=0.2235
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1675/500000]
+ train/ActionNoiseL2Loss=0.2467
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1676/500000]
+ train/ActionNoiseL2Loss=0.2377
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1677/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1678/500000]
+ train/ActionNoiseL2Loss=0.1889
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1679/500000]
+ train/ActionNoiseL2Loss=0.2156
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1680/500000]
+ optim/total_grad_norm=3.914
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1681/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1682/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1683/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1684/500000]
+ train/ActionNoiseL2Loss=0.1701
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1685/500000]
+ train/ActionNoiseL2Loss=0.2395
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1686/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1687/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1688/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1689/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1690/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1691/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1692/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1693/500000]
+ train/ActionNoiseL2Loss=0.2338
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1694/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1695/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1696/500000]
+ train/ActionNoiseL2Loss=0.2280
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1697/500000]
+ train/ActionNoiseL2Loss=0.2519
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1698/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1699/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1700/500000]
+ optim/total_grad_norm=2.775
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1701/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1702/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1703/500000]
+ train/ActionNoiseL2Loss=0.1803
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1704/500000]
+ train/ActionNoiseL2Loss=0.1789
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1705/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1706/500000]
+ train/ActionNoiseL2Loss=0.1733
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1707/500000]
+ train/ActionNoiseL2Loss=0.2369
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1708/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1709/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1710/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1711/500000]
+ train/ActionNoiseL2Loss=0.2174
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1712/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1713/500000]
+ train/ActionNoiseL2Loss=0.1466
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1714/500000]
+ train/ActionNoiseL2Loss=0.3613
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1715/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1716/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1717/500000]
+ train/ActionNoiseL2Loss=0.2384
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1718/500000]
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1719/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1720/500000]
+ optim/total_grad_norm=4.121
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1721/500000]
+ train/ActionNoiseL2Loss=0.1986
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1722/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1723/500000]
+ train/ActionNoiseL2Loss=0.1632
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1724/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1725/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1726/500000]
+ train/ActionNoiseL2Loss=0.2091
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1727/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1728/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1729/500000]
+ train/ActionNoiseL2Loss=0.1893
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1730/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1731/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1732/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1733/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1734/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1735/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1736/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1737/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1738/500000]
+ train/ActionNoiseL2Loss=0.2129
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1739/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1740/500000]
+ optim/total_grad_norm=2.633
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1741/500000]
+ train/ActionNoiseL2Loss=0.2074
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1742/500000]
+ train/ActionNoiseL2Loss=0.1797
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1743/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1744/500000]
+ train/ActionNoiseL2Loss=0.1363
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1745/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1746/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1747/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1748/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1749/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1750/500000]
+ train/ActionNoiseL2Loss=0.3080
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1751/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=1752/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1753/500000]
+ train/ActionNoiseL2Loss=0.1738
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1754/500000]
+ train/ActionNoiseL2Loss=0.2648
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1755/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=1756/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1757/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1758/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1759/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1760/500000]
+ optim/total_grad_norm=3.206
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,539
+[step=1761/500000]
+ train/ActionNoiseL2Loss=0.1591
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1762/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=1763/500000]
+ train/ActionNoiseL2Loss=0.2904
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1764/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1765/500000]
+ train/ActionNoiseL2Loss=0.1999
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1766/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1767/500000]
+ train/ActionNoiseL2Loss=0.1996
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1768/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1769/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1770/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1771/500000]
+ train/ActionNoiseL2Loss=0.2148
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1772/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1773/500000]
+ train/ActionNoiseL2Loss=0.2535
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1774/500000]
+ train/ActionNoiseL2Loss=0.2397
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1775/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1776/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1777/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1778/500000]
+ train/ActionNoiseL2Loss=0.2210
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1779/500000]
+ train/ActionNoiseL2Loss=0.2199
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1780/500000]
+ optim/total_grad_norm=2.892
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1781/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1782/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1783/500000]
+ train/ActionNoiseL2Loss=0.2432
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1784/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1785/500000]
+ train/ActionNoiseL2Loss=0.2830
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1786/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1787/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1788/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1789/500000]
+ train/ActionNoiseL2Loss=0.1750
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1790/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1791/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1792/500000]
+ train/ActionNoiseL2Loss=0.1736
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1793/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1794/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1795/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1796/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1797/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1798/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1799/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1800/500000]
+ optim/total_grad_norm=3.029
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1801/500000]
+ train/ActionNoiseL2Loss=0.2355
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1802/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1803/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1804/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1805/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1806/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1807/500000]
+ train/ActionNoiseL2Loss=0.1702
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1808/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1809/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1810/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1811/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1812/500000]
+ train/ActionNoiseL2Loss=0.1843
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1813/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1814/500000]
+ train/ActionNoiseL2Loss=0.2166
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1815/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1816/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1817/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1818/500000]
+ train/ActionNoiseL2Loss=0.1865
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1819/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1820/500000]
+ optim/total_grad_norm=2.952
+ train/ActionNoiseL2Loss=0.2227
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1821/500000]
+ train/ActionNoiseL2Loss=0.2211
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1822/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1823/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1824/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1825/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1826/500000]
+ train/ActionNoiseL2Loss=0.3007
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1827/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1828/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1829/500000]
+ train/ActionNoiseL2Loss=0.1693
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1830/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1831/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1832/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1833/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1834/500000]
+ train/ActionNoiseL2Loss=0.1989
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1835/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1836/500000]
+ train/ActionNoiseL2Loss=0.2065
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1837/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1838/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1839/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1840/500000]
+ optim/total_grad_norm=3.300
+ train/ActionNoiseL2Loss=0.1960
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=1841/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1842/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1843/500000]
+ train/ActionNoiseL2Loss=0.2415
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1844/500000]
+ train/ActionNoiseL2Loss=0.3150
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1845/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1846/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1847/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1848/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1849/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1850/500000]
+ train/ActionNoiseL2Loss=0.2684
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1851/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1852/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1853/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1854/500000]
+ train/ActionNoiseL2Loss=0.2093
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1855/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1856/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1857/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1858/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1859/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1860/500000]
+ optim/total_grad_norm=4.379
+ train/ActionNoiseL2Loss=0.2757
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1861/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1862/500000]
+ train/ActionNoiseL2Loss=0.1971
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1863/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1864/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1865/500000]
+ train/ActionNoiseL2Loss=0.2079
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1866/500000]
+ train/ActionNoiseL2Loss=0.1785
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1867/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1868/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1869/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=1870/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1871/500000]
+ train/ActionNoiseL2Loss=0.1689
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1872/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1873/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1874/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1875/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1876/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1877/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1878/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1879/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1880/500000]
+ optim/total_grad_norm=2.937
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1881/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1882/500000]
+ train/ActionNoiseL2Loss=0.2336
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1883/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1884/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1885/500000]
+ train/ActionNoiseL2Loss=0.1852
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1886/500000]
+ train/ActionNoiseL2Loss=0.1861
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1887/500000]
+ train/ActionNoiseL2Loss=0.1386
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1888/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1889/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1890/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=1891/500000]
+ train/ActionNoiseL2Loss=0.2308
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1892/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1893/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1894/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1895/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1896/500000]
+ train/ActionNoiseL2Loss=0.2564
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1897/500000]
+ train/ActionNoiseL2Loss=0.1803
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1898/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1899/500000]
+ train/ActionNoiseL2Loss=0.2535
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=1900/500000]
+ optim/total_grad_norm=2.601
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1901/500000]
+ train/ActionNoiseL2Loss=0.3026
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1902/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1903/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1904/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1905/500000]
+ train/ActionNoiseL2Loss=0.2115
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=1906/500000]
+ train/ActionNoiseL2Loss=0.1714
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=1907/500000]
+ train/ActionNoiseL2Loss=0.1976
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1908/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1909/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1910/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+ System/Peak GPU Memory (MB)=44,539
+[step=1911/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1912/500000]
+ train/ActionNoiseL2Loss=0.2115
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1913/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1914/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1915/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1916/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1917/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1918/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=1919/500000]
+ train/ActionNoiseL2Loss=0.1528
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=1920/500000]
+ optim/total_grad_norm=3.592
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1921/500000]
+ train/ActionNoiseL2Loss=0.2331
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1922/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1923/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1924/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1925/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1926/500000]
+ train/ActionNoiseL2Loss=0.2689
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1927/500000]
+ train/ActionNoiseL2Loss=0.2227
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1928/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1929/500000]
+ train/ActionNoiseL2Loss=0.1826
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1930/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1931/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1932/500000]
+ train/ActionNoiseL2Loss=0.2103
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1933/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1934/500000]
+ train/ActionNoiseL2Loss=0.1697
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1935/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1936/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1937/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1938/500000]
+ train/ActionNoiseL2Loss=0.2088
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1939/500000]
+ train/ActionNoiseL2Loss=0.2714
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1940/500000]
+ optim/total_grad_norm=4.163
+ train/ActionNoiseL2Loss=0.2026
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1941/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1942/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1943/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1944/500000]
+ train/ActionNoiseL2Loss=0.1854
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1945/500000]
+ train/ActionNoiseL2Loss=0.2182
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=1946/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1947/500000]
+ train/ActionNoiseL2Loss=0.1981
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1948/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1949/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=1950/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,539
+[step=1951/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1952/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1953/500000]
+ train/ActionNoiseL2Loss=0.2362
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1954/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1955/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1956/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1957/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1958/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1959/500000]
+ train/ActionNoiseL2Loss=0.1952
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1960/500000]
+ optim/total_grad_norm=3.020
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+[step=1961/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1962/500000]
+ train/ActionNoiseL2Loss=0.1737
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1963/500000]
+ train/ActionNoiseL2Loss=0.2045
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1964/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1965/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1966/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1967/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1968/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1969/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=1970/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,539
+[step=1971/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=1972/500000]
+ train/ActionNoiseL2Loss=0.2503
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=1973/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1974/500000]
+ train/ActionNoiseL2Loss=0.2620
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1975/500000]
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1976/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1977/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1978/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1979/500000]
+ train/ActionNoiseL2Loss=0.1893
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1980/500000]
+ optim/total_grad_norm=2.381
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1981/500000]
+ train/ActionNoiseL2Loss=0.1948
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1982/500000]
+ train/ActionNoiseL2Loss=0.1903
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1983/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1984/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1985/500000]
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1986/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1987/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1988/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1989/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=1990/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,539
+[step=1991/500000]
+ train/ActionNoiseL2Loss=0.2106
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=1992/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1993/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1994/500000]
+ train/ActionNoiseL2Loss=0.2270
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1995/500000]
+ train/ActionNoiseL2Loss=0.2518
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1996/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1997/500000]
+ train/ActionNoiseL2Loss=0.2070
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1998/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=1999/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2000/500000]
+ optim/total_grad_norm=2.923
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,539
+09/28 [22:58:51] INFO | >> Saving config... checkpoint.py:608
+09/28 [22:59:20] INFO | >> Saving model state... checkpoint.py:796
+09/28 [23:00:22] INFO | >> Saving optim state... checkpoint.py:811
+09/28 [23:00:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2002/500000]
+ train/ActionNoiseL2Loss=0.2433
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2003/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,069
+ throughput/device/batches_per_second=0.0445
+[step=2004/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,079
+ throughput/device/batches_per_second=0.0450
+[step=2005/500000]
+ train/ActionNoiseL2Loss=0.2507
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,086
+ throughput/device/batches_per_second=0.0453
+[step=2006/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=2007/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,095
+ throughput/device/batches_per_second=0.0456
+[step=2008/500000]
+ train/ActionNoiseL2Loss=0.1592
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,097
+ throughput/device/batches_per_second=0.0457
+[step=2009/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,099
+ throughput/device/batches_per_second=0.0458
+[step=2010/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+ System/Peak GPU Memory (MB)=44,547
+[step=2011/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,102
+ throughput/device/batches_per_second=0.0459
+[step=2012/500000]
+ train/ActionNoiseL2Loss=0.2246
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=2013/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=2014/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2015/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2016/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2017/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2018/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2019/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2020/500000]
+ optim/total_grad_norm=2.791
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=2021/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2022/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2023/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2024/500000]
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2025/500000]
+ train/ActionNoiseL2Loss=0.2111
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2026/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2027/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2028/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2029/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2030/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2031/500000]
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2032/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2033/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2034/500000]
+ train/ActionNoiseL2Loss=0.2994
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2035/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2036/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2037/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2038/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2039/500000]
+ train/ActionNoiseL2Loss=0.2392
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2040/500000]
+ optim/total_grad_norm=2.714
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2041/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2042/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2043/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2044/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2045/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2046/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2047/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2048/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2049/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2050/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2051/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2052/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2053/500000]
+ train/ActionNoiseL2Loss=0.1751
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2054/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2055/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2056/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2057/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2058/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2059/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2060/500000]
+ optim/total_grad_norm=2.688
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2061/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2062/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2063/500000]
+ train/ActionNoiseL2Loss=0.2008
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2064/500000]
+ train/ActionNoiseL2Loss=0.1767
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2065/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2066/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2067/500000]
+ train/ActionNoiseL2Loss=0.1404
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2068/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2069/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2070/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2071/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2072/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2073/500000]
+ train/ActionNoiseL2Loss=0.1726
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2074/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2075/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2076/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2077/500000]
+ train/ActionNoiseL2Loss=0.1948
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2078/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2079/500000]
+ train/ActionNoiseL2Loss=0.1739
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2080/500000]
+ optim/total_grad_norm=3.407
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2081/500000]
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2082/500000]
+ train/ActionNoiseL2Loss=0.2746
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2083/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2084/500000]
+ train/ActionNoiseL2Loss=0.1547
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2085/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2086/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2087/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2088/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2089/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2090/500000]
+ train/ActionNoiseL2Loss=0.1661
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2091/500000]
+ train/ActionNoiseL2Loss=0.1454
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2092/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2093/500000]
+ train/ActionNoiseL2Loss=0.2229
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2094/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2095/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2096/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2097/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2098/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2099/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2100/500000]
+ optim/total_grad_norm=1.917
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2101/500000]
+ train/ActionNoiseL2Loss=0.2820
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2102/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2103/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2104/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2105/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2106/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2107/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2108/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2109/500000]
+ train/ActionNoiseL2Loss=0.2015
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2110/500000]
+ train/ActionNoiseL2Loss=0.1919
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2111/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2112/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2113/500000]
+ train/ActionNoiseL2Loss=0.1614
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2114/500000]
+ train/ActionNoiseL2Loss=0.1744
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2115/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2116/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2117/500000]
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2118/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2119/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2120/500000]
+ optim/total_grad_norm=2.267
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2121/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2122/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2123/500000]
+ train/ActionNoiseL2Loss=0.2281
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2124/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2125/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2126/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2127/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2128/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2129/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2130/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2131/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2132/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2133/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2134/500000]
+ train/ActionNoiseL2Loss=0.2222
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2135/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2136/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2137/500000]
+ train/ActionNoiseL2Loss=0.2083
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2138/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2139/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2140/500000]
+ optim/total_grad_norm=3.111
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2141/500000]
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2142/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2143/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2144/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2145/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2146/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2147/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2148/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2149/500000]
+ train/ActionNoiseL2Loss=0.1900
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2150/500000]
+ train/ActionNoiseL2Loss=0.2827
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2151/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2152/500000]
+ train/ActionNoiseL2Loss=0.2142
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2153/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2154/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2155/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2156/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2157/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2158/500000]
+ train/ActionNoiseL2Loss=0.1990
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2159/500000]
+ train/ActionNoiseL2Loss=0.2142
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2160/500000]
+ optim/total_grad_norm=3.520
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2161/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2162/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2163/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2164/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2165/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2166/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2167/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2168/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2169/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=2170/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=2171/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2172/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2173/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2174/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2175/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2176/500000]
+ train/ActionNoiseL2Loss=0.2386
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2177/500000]
+ train/ActionNoiseL2Loss=0.2958
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2178/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2179/500000]
+ train/ActionNoiseL2Loss=0.2556
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2180/500000]
+ optim/total_grad_norm=1.425
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=2181/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2182/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2183/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2184/500000]
+ train/ActionNoiseL2Loss=0.1787
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2185/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2186/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2187/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2188/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2189/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2190/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2191/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2192/500000]
+ train/ActionNoiseL2Loss=0.2057
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2193/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2194/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2195/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2196/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2197/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2198/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2199/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2200/500000]
+ optim/total_grad_norm=2.778
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2201/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2202/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2203/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2204/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2205/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2206/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2207/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2208/500000]
+ train/ActionNoiseL2Loss=0.1490
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2209/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2210/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2211/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2212/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2213/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2214/500000]
+ train/ActionNoiseL2Loss=0.1811
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2215/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2216/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2217/500000]
+ train/ActionNoiseL2Loss=0.2214
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2218/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2219/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2220/500000]
+ optim/total_grad_norm=2.618
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2221/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2222/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2223/500000]
+ train/ActionNoiseL2Loss=0.2038
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2224/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2225/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2226/500000]
+ train/ActionNoiseL2Loss=0.2360
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2227/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2228/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2229/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2230/500000]
+ train/ActionNoiseL2Loss=0.2014
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2231/500000]
+ train/ActionNoiseL2Loss=0.1974
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2232/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2233/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2234/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2235/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2236/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2237/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2238/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2239/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2240/500000]
+ optim/total_grad_norm=2.913
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2241/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2242/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2243/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2244/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2245/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2246/500000]
+ train/ActionNoiseL2Loss=0.1801
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2247/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2248/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2249/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2250/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2251/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2252/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2253/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2254/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2255/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2256/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2257/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2258/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2259/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2260/500000]
+ optim/total_grad_norm=2.288
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2261/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2262/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2263/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2264/500000]
+ train/ActionNoiseL2Loss=0.2530
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2265/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2266/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2267/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2268/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2269/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2270/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2271/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2272/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2273/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2274/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2275/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2276/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2277/500000]
+ train/ActionNoiseL2Loss=0.2241
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2278/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2279/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2280/500000]
+ optim/total_grad_norm=2.249
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2281/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2282/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2283/500000]
+ train/ActionNoiseL2Loss=0.1442
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2284/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2285/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2286/500000]
+ train/ActionNoiseL2Loss=0.1592
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2287/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2288/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2289/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2290/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2291/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2292/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2293/500000]
+ train/ActionNoiseL2Loss=0.1819
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2294/500000]
+ train/ActionNoiseL2Loss=0.2230
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2295/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2296/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2297/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2298/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2299/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2300/500000]
+ optim/total_grad_norm=3.509
+ train/ActionNoiseL2Loss=0.2053
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2301/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2302/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2303/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2304/500000]
+ train/ActionNoiseL2Loss=0.2323
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2305/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2306/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2307/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2308/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2309/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2310/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2311/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2312/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2313/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2314/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2315/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2316/500000]
+ train/ActionNoiseL2Loss=0.1940
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2317/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2318/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2319/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2320/500000]
+ optim/total_grad_norm=2.137
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2321/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2322/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2323/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2324/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2325/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2326/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2327/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2328/500000]
+ train/ActionNoiseL2Loss=0.1728
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2329/500000]
+ train/ActionNoiseL2Loss=0.1549
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2330/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2331/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2332/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2333/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2334/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2335/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2336/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2337/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2338/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=2339/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2340/500000]
+ optim/total_grad_norm=2.599
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=2341/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2342/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2343/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2344/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2345/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2346/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2347/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2348/500000]
+ train/ActionNoiseL2Loss=0.2138
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2349/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2350/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=2351/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2352/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2353/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2354/500000]
+ train/ActionNoiseL2Loss=0.2102
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2355/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2356/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2357/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2358/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2359/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2360/500000]
+ optim/total_grad_norm=2.556
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2361/500000]
+ train/ActionNoiseL2Loss=0.1644
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2362/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2363/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2364/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2365/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2366/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2367/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2368/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2369/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2370/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2371/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2372/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2373/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2374/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2375/500000]
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2376/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2377/500000]
+ train/ActionNoiseL2Loss=0.2102
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2378/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2379/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2380/500000]
+ optim/total_grad_norm=2.292
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2381/500000]
+ train/ActionNoiseL2Loss=0.1406
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2382/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2383/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2384/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2385/500000]
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2386/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2387/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2388/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2389/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2390/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2391/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2392/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2393/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2394/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2395/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2396/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2397/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2398/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2399/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2400/500000]
+ optim/total_grad_norm=2.375
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2401/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2402/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2403/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2404/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2405/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2406/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2407/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2408/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2409/500000]
+ train/ActionNoiseL2Loss=0.1613
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2410/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2411/500000]
+ train/ActionNoiseL2Loss=0.2284
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2412/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2413/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2414/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2415/500000]
+ train/ActionNoiseL2Loss=0.1888
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2416/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2417/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2418/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2419/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2420/500000]
+ optim/total_grad_norm=2.422
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2421/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2422/500000]
+ train/ActionNoiseL2Loss=0.1928
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2423/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2424/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2425/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2426/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2427/500000]
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2428/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2429/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2430/500000]
+ train/ActionNoiseL2Loss=0.2470
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2431/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2432/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2433/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2434/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2435/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2436/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2437/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2438/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2439/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2440/500000]
+ optim/total_grad_norm=2.042
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2441/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2442/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2443/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2444/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2445/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2446/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2447/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2448/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2449/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2450/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2451/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2452/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2453/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2454/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2455/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2456/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2457/500000]
+ train/ActionNoiseL2Loss=0.1495
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2458/500000]
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=2459/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2460/500000]
+ optim/total_grad_norm=2.508
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=2461/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2462/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2463/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2464/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2465/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2466/500000]
+ train/ActionNoiseL2Loss=0.1816
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2467/500000]
+ train/ActionNoiseL2Loss=0.2297
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2468/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2469/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2470/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2471/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2472/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2473/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2474/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2475/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2476/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2477/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2478/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2479/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2480/500000]
+ optim/total_grad_norm=1.626
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2481/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2482/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2483/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2484/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2485/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2486/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2487/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2488/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2489/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2490/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2491/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2492/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2493/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2494/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2495/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2496/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2497/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2498/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2499/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2500/500000]
+ optim/total_grad_norm=2.414
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+09/29 [02:01:14] INFO | >> Saving config... checkpoint.py:608
+09/29 [02:01:42] INFO | >> Saving model state... checkpoint.py:796
+09/29 [02:02:42] INFO | >> Saving optim state... checkpoint.py:811
+09/29 [02:02:47] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2502/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,102
+ throughput/device/batches_per_second=0.0459
+[step=2503/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,084
+ throughput/device/batches_per_second=0.0452
+[step=2504/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=2505/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,096
+ throughput/device/batches_per_second=0.0457
+[step=2506/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,100
+ throughput/device/batches_per_second=0.0459
+[step=2507/500000]
+ train/ActionNoiseL2Loss=0.1801
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=2508/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=2509/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=2510/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=2511/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2512/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2513/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2514/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2515/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2516/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2517/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2518/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2519/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2520/500000]
+ optim/total_grad_norm=2.630
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2521/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2522/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2523/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2524/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2525/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2526/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2527/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2528/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2529/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2530/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2531/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2532/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2533/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2534/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2535/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2536/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2537/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2538/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2539/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2540/500000]
+ optim/total_grad_norm=2.921
+ train/ActionNoiseL2Loss=0.1805
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2541/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2542/500000]
+ train/ActionNoiseL2Loss=0.1788
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2543/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2544/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2545/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2546/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2547/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2548/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2549/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2550/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2551/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2552/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2553/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2554/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2555/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2556/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2557/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2558/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2559/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2560/500000]
+ optim/total_grad_norm=2.338
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2561/500000]
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2562/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2563/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2564/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2565/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2566/500000]
+ train/ActionNoiseL2Loss=0.2544
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2567/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2568/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=2569/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=2570/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2571/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2572/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2573/500000]
+ train/ActionNoiseL2Loss=0.1951
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2574/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2575/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2576/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2577/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2578/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2579/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2580/500000]
+ optim/total_grad_norm=1.680
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2581/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2582/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2583/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2584/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2585/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2586/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2587/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2588/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2589/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2590/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2591/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2592/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2593/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2594/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2595/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2596/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2597/500000]
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2598/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2599/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2600/500000]
+ optim/total_grad_norm=2.410
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2601/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2602/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2603/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2604/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2605/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2606/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2607/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2608/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2609/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2610/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2611/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2612/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2613/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2614/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2615/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2616/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2617/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2618/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2619/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2620/500000]
+ optim/total_grad_norm=1.650
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2621/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2622/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2623/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2624/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2625/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2626/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2627/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2628/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2629/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2630/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2631/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2632/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2633/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2634/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2635/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2636/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2637/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2638/500000]
+ train/ActionNoiseL2Loss=0.2124
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2639/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2640/500000]
+ optim/total_grad_norm=2.234
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2641/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2642/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2643/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2644/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2645/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2646/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2647/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2648/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2649/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2650/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2651/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2652/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2653/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2654/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2655/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2656/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2657/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2658/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2659/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2660/500000]
+ optim/total_grad_norm=2.194
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2661/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2662/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2663/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2664/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2665/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2666/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2667/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2668/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2669/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2670/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2671/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2672/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2673/500000]
+ train/ActionNoiseL2Loss=0.1998
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2674/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2675/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2676/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2677/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2678/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2679/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2680/500000]
+ optim/total_grad_norm=1.821
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2681/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2682/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2683/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2684/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2685/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2686/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2687/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2688/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2689/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2690/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2691/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2692/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2693/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=2694/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2695/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2696/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2697/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2698/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2699/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2700/500000]
+ optim/total_grad_norm=2.171
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=2701/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=2702/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2703/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2704/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2705/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2706/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2707/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2708/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2709/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2710/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2711/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2712/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2713/500000]
+ train/ActionNoiseL2Loss=0.2345
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2714/500000]
+ train/ActionNoiseL2Loss=0.1788
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2715/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2716/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2717/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2718/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2719/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2720/500000]
+ optim/total_grad_norm=3.012
+ train/ActionNoiseL2Loss=0.2005
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2721/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2722/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2723/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2724/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2725/500000]
+ train/ActionNoiseL2Loss=0.1466
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2726/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2727/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2728/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2729/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2730/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2731/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2732/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2733/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2734/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2735/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2736/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2737/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2738/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2739/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2740/500000]
+ optim/total_grad_norm=1.935
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2741/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2742/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2743/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2744/500000]
+ train/ActionNoiseL2Loss=0.1896
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2745/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2746/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2747/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2748/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2749/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2750/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2751/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2752/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2753/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2754/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2755/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2756/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2757/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2758/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2759/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2760/500000]
+ optim/total_grad_norm=3.052
+ train/ActionNoiseL2Loss=0.1723
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2761/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2762/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2763/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2764/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2765/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2766/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2767/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2768/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2769/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2770/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2771/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2772/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2773/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2774/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2775/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2776/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2777/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2778/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2779/500000]
+ train/ActionNoiseL2Loss=0.1800
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2780/500000]
+ optim/total_grad_norm=1.811
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2781/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2782/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2783/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2784/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2785/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2786/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2787/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2788/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2789/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2790/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2791/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2792/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2793/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2794/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2795/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2796/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2797/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2798/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2799/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2800/500000]
+ optim/total_grad_norm=2.606
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2801/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2802/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=2803/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2804/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=2805/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2806/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2807/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2808/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2809/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2810/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2811/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2812/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2813/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2814/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2815/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2816/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2817/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2818/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2819/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2820/500000]
+ optim/total_grad_norm=1.874
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2821/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2822/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=2823/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2824/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2825/500000]
+ train/ActionNoiseL2Loss=0.1962
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2826/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2827/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2828/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2829/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2830/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2831/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2832/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2833/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2834/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2835/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2836/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2837/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2838/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2839/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2840/500000]
+ optim/total_grad_norm=2.142
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2841/500000]
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2842/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2843/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2844/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2845/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2846/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2847/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2848/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2849/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2850/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2851/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=2852/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2853/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2854/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2855/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=2856/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2857/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2858/500000]
+ train/ActionNoiseL2Loss=0.1627
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2859/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2860/500000]
+ optim/total_grad_norm=2.284
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2861/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2862/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2863/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2864/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2865/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2866/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2867/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2868/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2869/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2870/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2871/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2872/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2873/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2874/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2875/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2876/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2877/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2878/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2879/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2880/500000]
+ optim/total_grad_norm=1.651
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2881/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2882/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2883/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2884/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2885/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2886/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2887/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2888/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2889/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2890/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2891/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2892/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2893/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2894/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2895/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2896/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2897/500000]
+ train/ActionNoiseL2Loss=0.1617
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=2898/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2899/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2900/500000]
+ optim/total_grad_norm=1.783
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2901/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2902/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2903/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2904/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2905/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2906/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2907/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2908/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2909/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2910/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=2911/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2912/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2913/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2914/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2915/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2916/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2917/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2918/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=2919/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=2920/500000]
+ optim/total_grad_norm=1.767
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2921/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2922/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2923/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2924/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2925/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2926/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2927/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2928/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2929/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2930/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2931/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2932/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2933/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2934/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2935/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2936/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2937/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2938/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2939/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2940/500000]
+ optim/total_grad_norm=2.080
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2941/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2942/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2943/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2944/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2945/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2946/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2947/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2948/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2949/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2950/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2951/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2952/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2953/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2954/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2955/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2956/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2957/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2958/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2959/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2960/500000]
+ optim/total_grad_norm=2.321
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=2961/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2962/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2963/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2964/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2965/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2966/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=2967/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2968/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2969/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=2970/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2971/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2972/500000]
+ train/ActionNoiseL2Loss=0.1994
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2973/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2974/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2975/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2976/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2977/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2978/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2979/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2980/500000]
+ optim/total_grad_norm=1.845
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2981/500000]
+ train/ActionNoiseL2Loss=0.1737
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2982/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=2983/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2984/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2985/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2986/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2987/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2988/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2989/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2990/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=2991/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2992/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2993/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2994/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2995/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2996/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2997/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2998/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=2999/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3000/500000]
+ optim/total_grad_norm=2.532
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+09/29 [05:03:17] INFO | >> Saving config... checkpoint.py:608
+09/29 [05:03:49] INFO | >> Saving model state... checkpoint.py:796
+09/29 [05:04:51] INFO | >> Saving optim state... checkpoint.py:811
+09/29 [05:04:56] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3002/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3003/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,081
+ throughput/device/batches_per_second=0.0451
+[step=3004/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,089
+ throughput/device/batches_per_second=0.0454
+[step=3005/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,094
+ throughput/device/batches_per_second=0.0456
+[step=3006/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,098
+ throughput/device/batches_per_second=0.0458
+[step=3007/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+[step=3008/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=3009/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=3010/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=3011/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3012/500000]
+ train/ActionNoiseL2Loss=0.2005
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0462
+[step=3013/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=3014/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3015/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3016/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3017/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3018/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3019/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3020/500000]
+ optim/total_grad_norm=2.981
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=3021/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3022/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3023/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3024/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3025/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3026/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3027/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3028/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3029/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3030/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3031/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3032/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=3033/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=3034/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3035/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3036/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3037/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3038/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3039/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3040/500000]
+ optim/total_grad_norm=2.264
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3041/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3042/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3043/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3044/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3045/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3046/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3047/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3048/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3049/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3050/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3051/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3052/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3053/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3054/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3055/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3056/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3057/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3058/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3059/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3060/500000]
+ optim/total_grad_norm=1.594
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3061/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3062/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3063/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3064/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3065/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3066/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3067/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3068/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3069/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3070/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3071/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3072/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3073/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3074/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3075/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3076/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3077/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3078/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3079/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3080/500000]
+ optim/total_grad_norm=1.834
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3081/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3082/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3083/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3084/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3085/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3086/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3087/500000]
+ train/ActionNoiseL2Loss=0.2089
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3088/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3089/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3090/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3091/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3092/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3093/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3094/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3095/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3096/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3097/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3098/500000]
+ train/ActionNoiseL2Loss=0.1566
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3099/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3100/500000]
+ optim/total_grad_norm=1.356
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3101/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3102/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3103/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3104/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3105/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3106/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3107/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3108/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3109/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3110/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=3111/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3112/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3113/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3114/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3115/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3116/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3117/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3118/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3119/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3120/500000]
+ optim/total_grad_norm=2.479
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3121/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3122/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3123/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3124/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3125/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3126/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3127/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3128/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3129/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3130/500000]
+ train/ActionNoiseL2Loss=0.1920
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3131/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3132/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3133/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3134/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3135/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3136/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3137/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3138/500000]
+ train/ActionNoiseL2Loss=0.1783
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3139/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3140/500000]
+ optim/total_grad_norm=1.903
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3141/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3142/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3143/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3144/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3145/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3146/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3147/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3148/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3149/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3150/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3151/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3152/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3153/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3154/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3155/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3156/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3157/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3158/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3159/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3160/500000]
+ optim/total_grad_norm=2.104
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3161/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3162/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3163/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3164/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3165/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3166/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3167/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3168/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3169/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3170/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3171/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3172/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3173/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3174/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3175/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3176/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3177/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3178/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3179/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3180/500000]
+ optim/total_grad_norm=2.259
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3181/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3182/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3183/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3184/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3185/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3186/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=3187/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3188/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3189/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3190/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=3191/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3192/500000]
+ train/ActionNoiseL2Loss=0.1746
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3193/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3194/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3195/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3196/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3197/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3198/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3199/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3200/500000]
+ optim/total_grad_norm=2.021
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3201/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3202/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3203/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3204/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3205/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3206/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3207/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3208/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3209/500000]
+ train/ActionNoiseL2Loss=0.1753
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3210/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3211/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3212/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3213/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3214/500000]
+ train/ActionNoiseL2Loss=0.1756
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3215/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3216/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3217/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3218/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3219/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3220/500000]
+ optim/total_grad_norm=1.612
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3221/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3222/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3223/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3224/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3225/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3226/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3227/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3228/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3229/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3230/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3231/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3232/500000]
+ train/ActionNoiseL2Loss=0.1986
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3233/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3234/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3235/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3236/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3237/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3238/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3239/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3240/500000]
+ optim/total_grad_norm=2.205
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3241/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3242/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3243/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3244/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3245/500000]
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3246/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3247/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3248/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3249/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3250/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3251/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3252/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3253/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3254/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3255/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3256/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3257/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3258/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3259/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3260/500000]
+ optim/total_grad_norm=1.639
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3261/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3262/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3263/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3264/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3265/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3266/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3267/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3268/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3269/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3270/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3271/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3272/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3273/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3274/500000]
+ train/ActionNoiseL2Loss=0.1668
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3275/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3276/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3277/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3278/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3279/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3280/500000]
+ optim/total_grad_norm=2.449
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3281/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3282/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3283/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3284/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3285/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3286/500000]
+ train/ActionNoiseL2Loss=0.2423
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3287/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3288/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3289/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3290/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3291/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3292/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3293/500000]
+ train/ActionNoiseL2Loss=0.1400
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3294/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3295/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3296/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3297/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3298/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3299/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3300/500000]
+ optim/total_grad_norm=2.474
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3301/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3302/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3303/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3304/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3305/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3306/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3307/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3308/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3309/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3310/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3311/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3312/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3313/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3314/500000]
+ train/ActionNoiseL2Loss=0.1386
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3315/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3316/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3317/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3318/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3319/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3320/500000]
+ optim/total_grad_norm=2.004
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3321/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3322/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3323/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3324/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3325/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3326/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3327/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3328/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3329/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3330/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3331/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3332/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3333/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3334/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3335/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3336/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3337/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3338/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3339/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3340/500000]
+ optim/total_grad_norm=2.162
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3341/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3342/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3343/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3344/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3345/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3346/500000]
+ train/ActionNoiseL2Loss=0.1632
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3347/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3348/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3349/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3350/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3351/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3352/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3353/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3354/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3355/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3356/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3357/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3358/500000]
+ train/ActionNoiseL2Loss=0.2000
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3359/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=3360/500000]
+ optim/total_grad_norm=1.685
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=3361/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3362/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3363/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3364/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3365/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3366/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3367/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3368/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3369/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3370/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=3371/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3372/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3373/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=3374/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3375/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3376/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3377/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3378/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3379/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3380/500000]
+ optim/total_grad_norm=1.923
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3381/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3382/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3383/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3384/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3385/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3386/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3387/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3388/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3389/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3390/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3391/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3392/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3393/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3394/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3395/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3396/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3397/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3398/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3399/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3400/500000]
+ optim/total_grad_norm=1.972
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3401/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3402/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3403/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3404/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3405/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3406/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3407/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3408/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3409/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3410/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3411/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3412/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3413/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3414/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3415/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3416/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3417/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3418/500000]
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3419/500000]
+ train/ActionNoiseL2Loss=0.2075
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3420/500000]
+ optim/total_grad_norm=1.913
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3421/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3422/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3423/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3424/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3425/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3426/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3427/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3428/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3429/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3430/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3431/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3432/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3433/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3434/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3435/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3436/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3437/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3438/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3439/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3440/500000]
+ optim/total_grad_norm=2.273
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3441/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3442/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3443/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3444/500000]
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3445/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3446/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3447/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3448/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3449/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3450/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3451/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=3452/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=3453/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=3454/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3455/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3456/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3457/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3458/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3459/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3460/500000]
+ optim/total_grad_norm=2.227
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=3461/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3462/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3463/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3464/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3465/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3466/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3467/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3468/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3469/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3470/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3471/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3472/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=3473/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3474/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3475/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3476/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3477/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3478/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3479/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3480/500000]
+ optim/total_grad_norm=1.784
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3481/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3482/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3483/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3484/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3485/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3486/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3487/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3488/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3489/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3490/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3491/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3492/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3493/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3494/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3495/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3496/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3497/500000]
+ train/ActionNoiseL2Loss=0.2125
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3498/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3499/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3500/500000]
+ optim/total_grad_norm=2.004
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+09/29 [08:05:28] INFO | >> Saving config... checkpoint.py:608
+09/29 [08:05:56] INFO | >> Saving model state... checkpoint.py:796
+09/29 [08:06:59] INFO | >> Saving optim state... checkpoint.py:811
+09/29 [08:07:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3502/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=3503/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,030
+ throughput/device/batches_per_second=0.0429
+[step=3504/500000]
+ train/ActionNoiseL2Loss=0.1638
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,044
+ throughput/device/batches_per_second=0.0435
+[step=3505/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,058
+ throughput/device/batches_per_second=0.0441
+[step=3506/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,068
+ throughput/device/batches_per_second=0.0445
+[step=3507/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,075
+ throughput/device/batches_per_second=0.0448
+[step=3508/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,079
+ throughput/device/batches_per_second=0.0450
+[step=3509/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,084
+ throughput/device/batches_per_second=0.0452
+[step=3510/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,087
+ throughput/device/batches_per_second=0.0453
+ System/Peak GPU Memory (MB)=44,547
+[step=3511/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,090
+ throughput/device/batches_per_second=0.0454
+[step=3512/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3513/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,094
+ throughput/device/batches_per_second=0.0456
+[step=3514/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,095
+ throughput/device/batches_per_second=0.0457
+[step=3515/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,097
+ throughput/device/batches_per_second=0.0457
+[step=3516/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,098
+ throughput/device/batches_per_second=0.0458
+[step=3517/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,099
+ throughput/device/batches_per_second=0.0458
+[step=3518/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,100
+ throughput/device/batches_per_second=0.0459
+[step=3519/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+[step=3520/500000]
+ optim/total_grad_norm=2.430
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+ System/Peak GPU Memory (MB)=44,547
+[step=3521/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+[step=3522/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=3523/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3524/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3525/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3526/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3527/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3528/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3529/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3530/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3531/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3532/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3533/500000]
+ train/ActionNoiseL2Loss=0.2061
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3534/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3535/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3536/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3537/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3538/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3539/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3540/500000]
+ optim/total_grad_norm=1.545
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3541/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3542/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3543/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3544/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3545/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3546/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3547/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3548/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3549/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3550/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3551/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3552/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3553/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3554/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3555/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3556/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3557/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3558/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3559/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3560/500000]
+ optim/total_grad_norm=2.145
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3561/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3562/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3563/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3564/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3565/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3566/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3567/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3568/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3569/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3570/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3571/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3572/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3573/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3574/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3575/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3576/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3577/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3578/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3579/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3580/500000]
+ optim/total_grad_norm=1.490
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3581/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3582/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3583/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3584/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3585/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3586/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3587/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3588/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3589/500000]
+ train/ActionNoiseL2Loss=0.2143
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3590/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3591/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3592/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3593/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3594/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3595/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3596/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3597/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3598/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3599/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3600/500000]
+ optim/total_grad_norm=2.834
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3601/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3602/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3603/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3604/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3605/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3606/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3607/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3608/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3609/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3610/500000]
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3611/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3612/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3613/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3614/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3615/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3616/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3617/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3618/500000]
+ train/ActionNoiseL2Loss=0.1638
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3619/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3620/500000]
+ optim/total_grad_norm=1.988
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3621/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3622/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3623/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3624/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3625/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3626/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3627/500000]
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3628/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3629/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3630/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3631/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3632/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3633/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3634/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3635/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3636/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3637/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3638/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3639/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3640/500000]
+ optim/total_grad_norm=2.713
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3641/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3642/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3643/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3644/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3645/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3646/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3647/500000]
+ train/ActionNoiseL2Loss=0.2531
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3648/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3649/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3650/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3651/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3652/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3653/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3654/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3655/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3656/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3657/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3658/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3659/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3660/500000]
+ optim/total_grad_norm=1.437
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3661/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3662/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3663/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3664/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3665/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3666/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3667/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3668/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3669/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3670/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3671/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3672/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3673/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3674/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3675/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3676/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3677/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3678/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3679/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3680/500000]
+ optim/total_grad_norm=2.640
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3681/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3682/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3683/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3684/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3685/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3686/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3687/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3688/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3689/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3690/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3691/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3692/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3693/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3694/500000]
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3695/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3696/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3697/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3698/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3699/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3700/500000]
+ optim/total_grad_norm=1.519
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3701/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3702/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3703/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3704/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3705/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3706/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3707/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3708/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3709/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3710/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3711/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3712/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3713/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3714/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3715/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3716/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3717/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3718/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3719/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3720/500000]
+ optim/total_grad_norm=2.133
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3721/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3722/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3723/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3724/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3725/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3726/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3727/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3728/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3729/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3730/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3731/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3732/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3733/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3734/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3735/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3736/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3737/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3738/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3739/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3740/500000]
+ optim/total_grad_norm=1.381
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3741/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3742/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3743/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3744/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3745/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3746/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3747/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3748/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3749/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3750/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=3751/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3752/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3753/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3754/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3755/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3756/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3757/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3758/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3759/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3760/500000]
+ optim/total_grad_norm=1.469
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=3761/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3762/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3763/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3764/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3765/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=3766/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,107
+ throughput/device/batches_per_second=0.0461
+[step=3767/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=3768/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=3769/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=3770/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3771/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3772/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3773/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3774/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3775/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3776/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3777/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3778/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3779/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3780/500000]
+ optim/total_grad_norm=2.138
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3781/500000]
+ train/ActionNoiseL2Loss=0.2176
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3782/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3783/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3784/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3785/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3786/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3787/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3788/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3789/500000]
+ train/ActionNoiseL2Loss=0.1627
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3790/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3791/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3792/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3793/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3794/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3795/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=3796/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3797/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3798/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3799/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3800/500000]
+ optim/total_grad_norm=1.712
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3801/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3802/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3803/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3804/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3805/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3806/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3807/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=3808/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=3809/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3810/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3811/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3812/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3813/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3814/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3815/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3816/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3817/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3818/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3819/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=3820/500000]
+ optim/total_grad_norm=1.920
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3821/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3822/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3823/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3824/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3825/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=3826/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3827/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3828/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3829/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3830/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3831/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3832/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3833/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3834/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3835/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3836/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3837/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3838/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3839/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3840/500000]
+ optim/total_grad_norm=1.548
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3841/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3842/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3843/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3844/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3845/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3846/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3847/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3848/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3849/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3850/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3851/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3852/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3853/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3854/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3855/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3856/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3857/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3858/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3859/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3860/500000]
+ optim/total_grad_norm=1.936
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3861/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3862/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3863/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3864/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3865/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3866/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3867/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3868/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3869/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3870/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3871/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3872/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3873/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3874/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3875/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3876/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3877/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3878/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3879/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3880/500000]
+ optim/total_grad_norm=1.545
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3881/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3882/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3883/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3884/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3885/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3886/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3887/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3888/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3889/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3890/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3891/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3892/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3893/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3894/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3895/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3896/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3897/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3898/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3899/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3900/500000]
+ optim/total_grad_norm=1.217
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=3901/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3902/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3903/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3904/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3905/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3906/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3907/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3908/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3909/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3910/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=3911/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3912/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3913/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3914/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=3915/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3916/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3917/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3918/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3919/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=3920/500000]
+ optim/total_grad_norm=1.762
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3921/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3922/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3923/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3924/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3925/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3926/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3927/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3928/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3929/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3930/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3931/500000]
+ train/ActionNoiseL2Loss=0.1577
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3932/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3933/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3934/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3935/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3936/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3937/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3938/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3939/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3940/500000]
+ optim/total_grad_norm=1.920
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3941/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3942/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3943/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3944/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3945/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3946/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=3947/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3948/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3949/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3950/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3951/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3952/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3953/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3954/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3955/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3956/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3957/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3958/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3959/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3960/500000]
+ optim/total_grad_norm=1.731
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+ System/Peak GPU Memory (MB)=44,547
+[step=3961/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3962/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=3963/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3964/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3965/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3966/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3967/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3968/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3969/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,092
+ throughput/device/batches_per_second=0.0455
+[step=3970/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3971/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3972/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3973/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3974/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3975/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3976/500000]
+ train/ActionNoiseL2Loss=0.1730
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3977/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3978/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3979/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3980/500000]
+ optim/total_grad_norm=1.707
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3981/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3982/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3983/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3984/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3985/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3986/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3987/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3988/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3989/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=3990/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=3991/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=3992/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3993/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3994/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3995/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3996/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3997/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3998/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=3999/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4000/500000]
+ optim/total_grad_norm=1.948
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+09/29 [11:07:29] INFO | >> Saving config... checkpoint.py:608
+09/29 [11:08:09] INFO | >> Saving model state... checkpoint.py:796
+09/29 [11:09:12] INFO | >> Saving optim state... checkpoint.py:811
+09/29 [11:09:17] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4002/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0460
+[step=4003/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,060
+ throughput/device/batches_per_second=0.0442
+[step=4004/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,065
+ throughput/device/batches_per_second=0.0444
+[step=4005/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,075
+ throughput/device/batches_per_second=0.0448
+[step=4006/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,082
+ throughput/device/batches_per_second=0.0451
+[step=4007/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,088
+ throughput/device/batches_per_second=0.0453
+[step=4008/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,091
+ throughput/device/batches_per_second=0.0455
+[step=4009/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,094
+ throughput/device/batches_per_second=0.0456
+[step=4010/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,096
+ throughput/device/batches_per_second=0.0457
+ System/Peak GPU Memory (MB)=44,547
+[step=4011/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,098
+ throughput/device/batches_per_second=0.0458
+[step=4012/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,099
+ throughput/device/batches_per_second=0.0458
+[step=4013/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,101
+ throughput/device/batches_per_second=0.0459
+[step=4014/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,102
+ throughput/device/batches_per_second=0.0459
+[step=4015/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,103
+ throughput/device/batches_per_second=0.0460
+[step=4016/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,104
+ throughput/device/batches_per_second=0.0460
+[step=4017/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0460
+[step=4018/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=4019/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=4020/500000]
+ optim/total_grad_norm=1.800
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=4021/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=4022/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4023/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4024/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4025/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4026/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4027/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4028/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4029/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4030/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4031/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4032/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4033/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4034/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4035/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4036/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4037/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4038/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4039/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4040/500000]
+ optim/total_grad_norm=1.776
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4041/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4042/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4043/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4044/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4045/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4046/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4047/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4048/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4049/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4050/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4051/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4052/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4053/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4054/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4055/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4056/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4057/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4058/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4059/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4060/500000]
+ optim/total_grad_norm=2.129
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4061/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4062/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4063/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4064/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4065/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4066/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4067/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4068/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4069/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4070/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4071/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4072/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4073/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4074/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4075/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4076/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4077/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4078/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4079/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4080/500000]
+ optim/total_grad_norm=1.947
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4081/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4082/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4083/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4084/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4085/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4086/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4087/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4088/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4089/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4090/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4091/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4092/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4093/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4094/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4095/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4096/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4097/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4098/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4099/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4100/500000]
+ optim/total_grad_norm=1.441
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4101/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4102/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4103/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4104/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4105/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4106/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4107/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4108/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4109/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4110/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4111/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4112/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4113/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4114/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4115/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4116/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4117/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4118/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4119/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4120/500000]
+ optim/total_grad_norm=2.855
+ train/ActionNoiseL2Loss=0.2254
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4121/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4122/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4123/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4124/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4125/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4126/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4127/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4128/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4129/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4130/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4131/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4132/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4133/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4134/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4135/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4136/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4137/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4138/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4139/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4140/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4141/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4142/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4143/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4144/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4145/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4146/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4147/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4148/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4149/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4150/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4151/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4152/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4153/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4154/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4155/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4156/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4157/500000]
+ train/ActionNoiseL2Loss=0.1435
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4158/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4159/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4160/500000]
+ optim/total_grad_norm=1.600
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4161/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4162/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4163/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4164/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4165/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4166/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4167/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4168/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4169/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4170/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4171/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4172/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4173/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4174/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4175/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4176/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4177/500000]
+ train/ActionNoiseL2Loss=0.1759
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4178/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4179/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4180/500000]
+ optim/total_grad_norm=1.617
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4181/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4182/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4183/500000]
+ train/ActionNoiseL2Loss=0.1571
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4184/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4185/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4186/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4187/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4188/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4189/500000]
+ train/ActionNoiseL2Loss=0.1904
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4190/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4191/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4192/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4193/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4194/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4195/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4196/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4197/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4198/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4199/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4200/500000]
+ optim/total_grad_norm=1.700
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4201/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4202/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4203/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4204/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4205/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4206/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4207/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4208/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4209/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4210/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4211/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4212/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4213/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4214/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4215/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4216/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4217/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4218/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4219/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4220/500000]
+ optim/total_grad_norm=1.399
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4221/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4222/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4223/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4224/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4225/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4226/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4227/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4228/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4229/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4230/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4231/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4232/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4233/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4234/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4235/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4236/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4237/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4238/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4239/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4240/500000]
+ optim/total_grad_norm=2.198
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4241/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4242/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4243/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4244/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4245/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4246/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4247/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4248/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4249/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4250/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4251/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4252/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4253/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4254/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4255/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4256/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4257/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4258/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4259/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4260/500000]
+ optim/total_grad_norm=1.944
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4261/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4262/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4263/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4264/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4265/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4266/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4267/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4268/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4269/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4270/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4271/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4272/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4273/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4274/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4275/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4276/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4277/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4278/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4279/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4280/500000]
+ optim/total_grad_norm=2.310
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4281/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4282/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4283/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4284/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4285/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4286/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4287/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4288/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4289/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4290/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4291/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4292/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4293/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4294/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4295/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4296/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4297/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4298/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4299/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4300/500000]
+ optim/total_grad_norm=1.920
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4301/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4302/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4303/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4304/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4305/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4306/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4307/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4308/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4309/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4310/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4311/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4312/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4313/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4314/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4315/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4316/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4317/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4318/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4319/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4320/500000]
+ optim/total_grad_norm=1.506
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=4321/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4322/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4323/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4324/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4325/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4326/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4327/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4328/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4329/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4330/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=4331/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4332/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4333/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4334/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4335/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4336/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4337/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4338/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4339/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4340/500000]
+ optim/total_grad_norm=2.257
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4341/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4342/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4343/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4344/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4345/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4346/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4347/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4348/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4349/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=4350/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4351/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4352/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4353/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4354/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4355/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4356/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,110
+ throughput/device/batches_per_second=0.0463
+[step=4357/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4358/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=4359/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+[step=4360/500000]
+ optim/total_grad_norm=1.723
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,105
+ throughput/device/batches_per_second=0.0461
+ System/Peak GPU Memory (MB)=44,547
+[step=4361/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=4362/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,106
+ throughput/device/batches_per_second=0.0461
+[step=4363/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4364/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4365/500000]
+ train/ActionNoiseL2Loss=0.1794
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=4366/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=4367/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4368/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4369/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,111
+ throughput/device/batches_per_second=0.0463
+[step=4370/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4371/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4372/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4373/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4374/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4375/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4376/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4377/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4378/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4379/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4380/500000]
+ optim/total_grad_norm=1.908
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4381/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4382/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4383/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4384/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4385/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4386/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4387/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4388/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4389/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4390/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4391/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4392/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4393/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4394/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4395/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4396/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4397/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4398/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4399/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4400/500000]
+ optim/total_grad_norm=1.828
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4401/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4402/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4403/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4404/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4405/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4406/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4407/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4408/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4409/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4410/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4411/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4412/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4413/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4414/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4415/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4416/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4417/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4418/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4419/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4420/500000]
+ optim/total_grad_norm=1.682
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4421/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4422/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4423/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4424/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4425/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4426/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4427/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4428/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4429/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4430/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4431/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4432/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4433/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4434/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4435/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4436/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4437/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4438/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4439/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4440/500000]
+ optim/total_grad_norm=2.110
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4441/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4442/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4443/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4444/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4445/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4446/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4447/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4448/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4449/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4450/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4451/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4452/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4453/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4454/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4455/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4456/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4457/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4458/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4459/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4460/500000]
+ optim/total_grad_norm=1.417
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4461/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4462/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4463/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4464/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4465/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4466/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4467/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4468/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4469/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4470/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4471/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4472/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4473/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4474/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4475/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4476/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4477/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4478/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4479/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4480/500000]
+ optim/total_grad_norm=1.325
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4481/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4482/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4483/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4484/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4485/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4486/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4487/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4488/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4489/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=4490/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+ System/Peak GPU Memory (MB)=44,547
+[step=4491/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0464
+[step=4492/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+[step=4493/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4494/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4495/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4496/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4497/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4498/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4499/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4500/500000]
+ optim/total_grad_norm=2.054
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+09/29 [14:09:40] INFO | >> Saving config... checkpoint.py:608
+09/29 [14:10:12] INFO | >> Saving model state... checkpoint.py:796
+09/29 [14:11:15] INFO | >> Saving optim state... checkpoint.py:811
+09/29 [14:11:20] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4502/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=4503/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=4504/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4505/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4506/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4507/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4508/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4509/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=4510/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4511/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=4512/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=4513/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4514/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4515/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4516/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4517/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4518/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4519/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4520/500000]
+ optim/total_grad_norm=1.324
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4521/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4522/500000]
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4523/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4524/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4525/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4526/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4527/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4528/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4529/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4530/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4531/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4532/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4533/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4534/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4535/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4536/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4537/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4538/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4539/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4540/500000]
+ optim/total_grad_norm=1.813
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4541/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4542/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4543/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4544/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4545/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4546/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4547/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4548/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4549/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4550/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4551/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4552/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4553/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4554/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4555/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4556/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4557/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4558/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4559/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4560/500000]
+ optim/total_grad_norm=1.451
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4561/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4562/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4563/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4564/500000]
+ train/ActionNoiseL2Loss=0.1643
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4565/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4566/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4567/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4568/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4569/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4570/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4571/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4572/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4573/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4574/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4575/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4576/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4577/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4578/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4579/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4580/500000]
+ optim/total_grad_norm=1.211
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4581/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4582/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4583/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4584/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4585/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4586/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4587/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4588/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4589/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4590/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4591/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4592/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4593/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4594/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4595/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4596/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4597/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4598/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4599/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4600/500000]
+ optim/total_grad_norm=1.372
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4601/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4602/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4603/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4604/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4605/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4606/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4607/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4608/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4609/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4610/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4611/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4612/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4613/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4614/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4615/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4616/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4617/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4618/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4619/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4620/500000]
+ optim/total_grad_norm=1.493
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4621/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4622/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4623/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4624/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4625/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4626/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4627/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4628/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4629/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4630/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4631/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4632/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4633/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4634/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4635/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4636/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4637/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4638/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4639/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4640/500000]
+ optim/total_grad_norm=1.899
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4641/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4642/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4643/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4644/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4645/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4646/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4647/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4648/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4649/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4650/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4651/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4652/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=4653/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4654/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4655/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4656/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4657/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4658/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4659/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,109
+ throughput/device/batches_per_second=0.0462
+[step=4660/500000]
+ optim/total_grad_norm=2.136
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+ System/Peak GPU Memory (MB)=44,547
+[step=4661/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4662/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4663/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4664/500000]
+ train/ActionNoiseL2Loss=0.2168
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4665/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4666/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4667/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4668/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4669/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,108
+ throughput/device/batches_per_second=0.0462
+[step=4670/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0463
+ System/Peak GPU Memory (MB)=44,547
+[step=4671/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,112
+ throughput/device/batches_per_second=0.0464
+[step=4672/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4673/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4674/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4675/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4676/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4677/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4678/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4679/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4680/500000]
+ optim/total_grad_norm=1.523
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4681/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4682/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4683/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4684/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4685/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4686/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4687/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4688/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4689/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4690/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4691/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4692/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4693/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4694/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4695/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4696/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4697/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4698/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4699/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4700/500000]
+ optim/total_grad_norm=1.680
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4701/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4702/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4703/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4704/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4705/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4706/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4707/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4708/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4709/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4710/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4711/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4712/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4713/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4714/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4715/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4716/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4717/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4718/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4719/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4720/500000]
+ optim/total_grad_norm=2.164
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4721/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4722/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4723/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4724/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4725/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4726/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4727/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4728/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4729/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4730/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4731/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4732/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4733/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4734/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4735/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4736/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4737/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4738/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4739/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4740/500000]
+ optim/total_grad_norm=1.558
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4741/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4742/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4743/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4744/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4745/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4746/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4747/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4748/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4749/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4750/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4751/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4752/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4753/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4754/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4755/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4756/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4757/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4758/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4759/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4760/500000]
+ optim/total_grad_norm=1.695
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4761/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4762/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4763/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4764/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4765/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4766/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4767/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4768/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,115
+ throughput/device/batches_per_second=0.0465
+[step=4769/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4770/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4771/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4772/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4773/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4774/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4775/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4776/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4777/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4778/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4779/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4780/500000]
+ optim/total_grad_norm=2.712
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4781/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4782/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4783/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4784/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4785/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4786/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4787/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4788/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4789/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4790/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4791/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4792/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4793/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4794/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4795/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4796/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4797/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4798/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4799/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4800/500000]
+ optim/total_grad_norm=1.784
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4801/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4802/500000]
+ train/ActionNoiseL2Loss=0.1945
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4803/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4804/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4805/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4806/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4807/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4808/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4809/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4810/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4811/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4812/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4813/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4814/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4815/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4816/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4817/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4818/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4819/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4820/500000]
+ optim/total_grad_norm=1.701
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4821/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4822/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4823/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4824/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4825/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4826/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4827/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4828/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4829/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4830/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4831/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4832/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4833/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4834/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4835/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4836/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4837/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4838/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4839/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4840/500000]
+ optim/total_grad_norm=1.253
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4841/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4842/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4843/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4844/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4845/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4846/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4847/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4848/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4849/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4850/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4851/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4852/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4853/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4854/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4855/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4856/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4857/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4858/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4859/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4860/500000]
+ optim/total_grad_norm=2.405
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4861/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4862/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4863/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4864/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4865/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4866/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4867/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4868/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4869/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4870/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4871/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4872/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4873/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4874/500000]
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4875/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4876/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4877/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4878/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4879/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4880/500000]
+ optim/total_grad_norm=0.9752
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4881/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4882/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4883/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4884/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4885/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4886/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4887/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4888/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4889/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4890/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4891/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4892/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4893/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4894/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4895/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4896/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4897/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4898/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4899/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4900/500000]
+ optim/total_grad_norm=1.153
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4901/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4902/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4903/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4904/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4905/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4906/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4907/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4908/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4909/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4910/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+ System/Peak GPU Memory (MB)=44,547
+[step=4911/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4912/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4913/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4914/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4915/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4916/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4917/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4918/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4919/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,116
+ throughput/device/batches_per_second=0.0465
+[step=4920/500000]
+ optim/total_grad_norm=1.281
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4921/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4922/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4923/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4924/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0466
+[step=4925/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4926/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4927/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4928/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4929/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4930/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4931/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4932/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4933/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4934/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4935/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4936/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4937/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4938/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4939/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4940/500000]
+ optim/total_grad_norm=1.708
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4941/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4942/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4943/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4944/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4945/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4946/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4947/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4948/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4949/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+[step=4950/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4951/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4952/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4953/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4954/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4955/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4956/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4957/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4958/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4959/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4960/500000]
+ optim/total_grad_norm=2.039
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+ System/Peak GPU Memory (MB)=44,547
+[step=4961/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4962/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4963/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4964/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4965/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4966/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,118
+ throughput/device/batches_per_second=0.0466
+[step=4967/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4968/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=4969/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0465
+[step=4970/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,120
+ throughput/device/batches_per_second=0.0467
+ System/Peak GPU Memory (MB)=44,547
+[step=4971/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4972/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4973/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
+[step=4974/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,119
+ throughput/device/batches_per_second=0.0467
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/requirements.txt b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..291a344502cb68f8ac9dcf95e2d7e2df5f47b9b6
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/requirements.txt
@@ -0,0 +1,284 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/wandb-metadata.json b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..9a27a72e006494e9496d08d14f3567f3020d734c
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-09-28T10:46:55.598253Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--lora_rank",
+ "32",
+ "--lora_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "4bc163cc0eab3abc66a1d330d90c6009d30eb98e"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/wandb",
+ "host": "auh7-1b-gpu-292",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50808598528"
+ }
+ },
+ "memory": {
+ "total": "2434606923776"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0x2a954aa975e59d15",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xad1bf75f50313455",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xbabaa83bdb6fe877",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x333c966d5f3b3375",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0xc6ed7c5159e83b1",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x5656afec2788d569",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xa95e252cd7a6e54e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xdee6d87744a36ae",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759315545",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "1796",
+ "job_name": "realworld_mh",
+ "job_nodelist": "auh7-1b-gpu-292",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759056345",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "1796",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-292",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "1094895",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-292",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "iqipvq7mbtgd8qiqhzdhnaaxotwr4cda"
+}
\ No newline at end of file
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-core.log b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..fa15fb7e5064687244d47997aa26f940064b1edb
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-09-28T10:46:55.841115783Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpsl8k30de/port-1095073.txt","pid":1095073,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-09-28T10:46:55.842830172Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1095073}
+{"time":"2025-09-28T10:46:55.843998872Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1095073-1095474-3931118195/socket","Net":"unix"}}
+{"time":"2025-09-28T10:46:55.846183139Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-09-28T10:46:55.861688513Z","level":"INFO","msg":"handleInformInit: received","streamId":"3b31u4we","id":"1(@)"}
+{"time":"2025-09-28T10:46:57.115500269Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"3b31u4we","id":"1(@)"}
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-internal.log b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..112205f5758dea622258c88ab58ad09bc08afda6
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-09-28T10:46:55.863725767Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-09-28T10:46:57.115450508Z","level":"INFO","msg":"stream: created new stream","id":"3b31u4we"}
+{"time":"2025-09-28T10:46:57.115494559Z","level":"INFO","msg":"stream: started","id":"3b31u4we"}
+{"time":"2025-09-28T10:46:57.115514719Z","level":"INFO","msg":"handler: started","stream_id":"3b31u4we"}
+{"time":"2025-09-28T10:46:57.115518199Z","level":"INFO","msg":"writer: started","stream_id":"3b31u4we"}
+{"time":"2025-09-28T10:46:57.11554652Z","level":"INFO","msg":"sender: started","stream_id":"3b31u4we"}
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug.log b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/run-3b31u4we.wandb b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/run-3b31u4we.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..1cdb38518f449bdc5d92869ee32f96b154182a1c
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20250928_104655-3b31u4we/run-3b31u4we.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c44d9fd8f59982bceb2465e994691fb74dbc5bdc54be7b059019fcfa7eec52a0
+size 367591424
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/output.log b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..6aa0faf517dc21e6c9d8557e3ce404f3fbc39deb
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/output.log
@@ -0,0 +1,63018 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/02 [16:45:40] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_StickyNote', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Test_Glue', 1, 'bounds'], ['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe', 1, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/02 [16:45:46] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+10/02 [16:45:47] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk
+****** length of the dataset: 72641
+10/02 [16:45:55] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50
+****** length of the dataset: 27906
+10/02 [16:45:58] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser
+****** length of the dataset: 13441
+10/02 [16:45:59] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+10/02 [16:46:00] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen
+****** length of the dataset: 17131
+10/02 [16:46:01] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_StickyNote
+****** length of the dataset: 15765
+10/02 [16:46:02] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Test_Glue
+****** length of the dataset: 90
+10/02 [16:46:03] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe
+****** length of the dataset: 18397
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: [, , , , , , , ]
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/02 [16:46:04] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* After get lora params successfully
+10/02 [16:47:22] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=36,856
+10/02 [16:47:23] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+10/02 [16:47:30] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.751
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=39,644
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.716
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+ System/Peak GPU Memory (MB)=46,466
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.791
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.797
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.626
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.587
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.715
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8/500000]
+ train/ActionNoiseL2Loss=1.611
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9/500000]
+ train/ActionNoiseL2Loss=1.500
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10/500000]
+ train/ActionNoiseL2Loss=1.526
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=11/500000]
+ train/ActionNoiseL2Loss=1.508
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=12/500000]
+ train/ActionNoiseL2Loss=1.489
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=13/500000]
+ train/ActionNoiseL2Loss=1.390
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=14/500000]
+ train/ActionNoiseL2Loss=1.480
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=15/500000]
+ train/ActionNoiseL2Loss=1.424
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=16/500000]
+ train/ActionNoiseL2Loss=1.579
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=17/500000]
+ train/ActionNoiseL2Loss=1.399
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=18/500000]
+ train/ActionNoiseL2Loss=1.477
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=19/500000]
+ train/ActionNoiseL2Loss=1.379
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=20/500000]
+ optim/total_grad_norm=15.52
+ train/ActionNoiseL2Loss=1.344
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=21/500000]
+ train/ActionNoiseL2Loss=1.507
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=22/500000]
+ train/ActionNoiseL2Loss=1.337
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=23/500000]
+ train/ActionNoiseL2Loss=1.329
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=24/500000]
+ train/ActionNoiseL2Loss=1.480
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=25/500000]
+ train/ActionNoiseL2Loss=1.293
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=26/500000]
+ train/ActionNoiseL2Loss=1.370
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=27/500000]
+ train/ActionNoiseL2Loss=1.457
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=28/500000]
+ train/ActionNoiseL2Loss=1.421
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=29/500000]
+ train/ActionNoiseL2Loss=1.430
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=30/500000]
+ train/ActionNoiseL2Loss=1.286
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=31/500000]
+ train/ActionNoiseL2Loss=1.326
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=32/500000]
+ train/ActionNoiseL2Loss=1.165
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=33/500000]
+ train/ActionNoiseL2Loss=1.290
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=34/500000]
+ train/ActionNoiseL2Loss=1.303
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=35/500000]
+ train/ActionNoiseL2Loss=1.179
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=36/500000]
+ train/ActionNoiseL2Loss=1.308
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=37/500000]
+ train/ActionNoiseL2Loss=1.182
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=38/500000]
+ train/ActionNoiseL2Loss=1.176
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=39/500000]
+ train/ActionNoiseL2Loss=1.257
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=40/500000]
+ optim/total_grad_norm=13.02
+ train/ActionNoiseL2Loss=1.165
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=41/500000]
+ train/ActionNoiseL2Loss=1.149
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=42/500000]
+ train/ActionNoiseL2Loss=1.172
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=43/500000]
+ train/ActionNoiseL2Loss=1.268
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=44/500000]
+ train/ActionNoiseL2Loss=1.381
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=45/500000]
+ train/ActionNoiseL2Loss=1.126
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=46/500000]
+ train/ActionNoiseL2Loss=1.103
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=47/500000]
+ train/ActionNoiseL2Loss=1.153
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=48/500000]
+ train/ActionNoiseL2Loss=1.172
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=49/500000]
+ train/ActionNoiseL2Loss=1.084
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=50/500000]
+ train/ActionNoiseL2Loss=1.240
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=51/500000]
+ train/ActionNoiseL2Loss=1.187
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=52/500000]
+ train/ActionNoiseL2Loss=1.109
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=53/500000]
+ train/ActionNoiseL2Loss=1.135
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=54/500000]
+ train/ActionNoiseL2Loss=1.211
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=55/500000]
+ train/ActionNoiseL2Loss=1.045
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=56/500000]
+ train/ActionNoiseL2Loss=1.149
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=57/500000]
+ train/ActionNoiseL2Loss=1.213
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=58/500000]
+ train/ActionNoiseL2Loss=1.137
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=59/500000]
+ train/ActionNoiseL2Loss=1.123
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=60/500000]
+ optim/total_grad_norm=16.09
+ train/ActionNoiseL2Loss=1.096
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=61/500000]
+ train/ActionNoiseL2Loss=1.102
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=62/500000]
+ train/ActionNoiseL2Loss=1.076
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=63/500000]
+ train/ActionNoiseL2Loss=1.056
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=64/500000]
+ train/ActionNoiseL2Loss=0.9842
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=65/500000]
+ train/ActionNoiseL2Loss=1.127
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=66/500000]
+ train/ActionNoiseL2Loss=1.099
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=67/500000]
+ train/ActionNoiseL2Loss=0.9832
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=68/500000]
+ train/ActionNoiseL2Loss=1.106
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=69/500000]
+ train/ActionNoiseL2Loss=1.028
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=70/500000]
+ train/ActionNoiseL2Loss=1.011
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=71/500000]
+ train/ActionNoiseL2Loss=1.005
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=72/500000]
+ train/ActionNoiseL2Loss=0.9974
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=73/500000]
+ train/ActionNoiseL2Loss=1.012
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=74/500000]
+ train/ActionNoiseL2Loss=1.003
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=75/500000]
+ train/ActionNoiseL2Loss=0.9863
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=76/500000]
+ train/ActionNoiseL2Loss=0.9746
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=77/500000]
+ train/ActionNoiseL2Loss=0.9308
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=78/500000]
+ train/ActionNoiseL2Loss=0.9764
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=79/500000]
+ train/ActionNoiseL2Loss=1.121
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=80/500000]
+ optim/total_grad_norm=15.62
+ train/ActionNoiseL2Loss=0.9447
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=81/500000]
+ train/ActionNoiseL2Loss=1.194
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=82/500000]
+ train/ActionNoiseL2Loss=1.063
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=83/500000]
+ train/ActionNoiseL2Loss=1.056
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=84/500000]
+ train/ActionNoiseL2Loss=1.069
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=85/500000]
+ train/ActionNoiseL2Loss=1.200
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=86/500000]
+ train/ActionNoiseL2Loss=0.9582
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=87/500000]
+ train/ActionNoiseL2Loss=0.9938
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=88/500000]
+ train/ActionNoiseL2Loss=0.9740
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=89/500000]
+ train/ActionNoiseL2Loss=1.064
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=90/500000]
+ train/ActionNoiseL2Loss=0.8568
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=91/500000]
+ train/ActionNoiseL2Loss=0.9748
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=92/500000]
+ train/ActionNoiseL2Loss=0.9276
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=93/500000]
+ train/ActionNoiseL2Loss=0.9539
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=94/500000]
+ train/ActionNoiseL2Loss=0.8286
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=95/500000]
+ train/ActionNoiseL2Loss=0.9718
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=96/500000]
+ train/ActionNoiseL2Loss=0.9655
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=97/500000]
+ train/ActionNoiseL2Loss=0.8137
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=98/500000]
+ train/ActionNoiseL2Loss=1.096
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=99/500000]
+ train/ActionNoiseL2Loss=0.8410
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=100/500000]
+ optim/total_grad_norm=16.47
+ train/ActionNoiseL2Loss=0.9397
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=101/500000]
+ train/ActionNoiseL2Loss=0.9152
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=102/500000]
+ train/ActionNoiseL2Loss=0.8826
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=103/500000]
+ train/ActionNoiseL2Loss=0.7942
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=104/500000]
+ train/ActionNoiseL2Loss=0.9235
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=105/500000]
+ train/ActionNoiseL2Loss=0.9592
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=106/500000]
+ train/ActionNoiseL2Loss=0.9190
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=107/500000]
+ train/ActionNoiseL2Loss=0.8932
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=108/500000]
+ train/ActionNoiseL2Loss=0.9262
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=109/500000]
+ train/ActionNoiseL2Loss=0.8150
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=110/500000]
+ train/ActionNoiseL2Loss=0.7403
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=111/500000]
+ train/ActionNoiseL2Loss=0.7451
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=112/500000]
+ train/ActionNoiseL2Loss=1.023
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=113/500000]
+ train/ActionNoiseL2Loss=0.8363
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=114/500000]
+ train/ActionNoiseL2Loss=0.9321
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=115/500000]
+ train/ActionNoiseL2Loss=0.9400
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=116/500000]
+ train/ActionNoiseL2Loss=0.7540
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=117/500000]
+ train/ActionNoiseL2Loss=0.9090
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=118/500000]
+ train/ActionNoiseL2Loss=0.9457
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=119/500000]
+ train/ActionNoiseL2Loss=0.7702
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=120/500000]
+ optim/total_grad_norm=14.92
+ train/ActionNoiseL2Loss=0.9145
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=121/500000]
+ train/ActionNoiseL2Loss=0.8528
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=122/500000]
+ train/ActionNoiseL2Loss=0.9821
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=123/500000]
+ train/ActionNoiseL2Loss=0.9461
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=124/500000]
+ train/ActionNoiseL2Loss=0.8982
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=125/500000]
+ train/ActionNoiseL2Loss=0.7940
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=126/500000]
+ train/ActionNoiseL2Loss=0.8629
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=127/500000]
+ train/ActionNoiseL2Loss=0.7471
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=128/500000]
+ train/ActionNoiseL2Loss=1.107
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=129/500000]
+ train/ActionNoiseL2Loss=0.8590
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=130/500000]
+ train/ActionNoiseL2Loss=0.7386
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=131/500000]
+ train/ActionNoiseL2Loss=0.9495
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=132/500000]
+ train/ActionNoiseL2Loss=0.7587
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=133/500000]
+ train/ActionNoiseL2Loss=0.9139
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=134/500000]
+ train/ActionNoiseL2Loss=0.8664
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=135/500000]
+ train/ActionNoiseL2Loss=0.7986
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=136/500000]
+ train/ActionNoiseL2Loss=0.8178
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=137/500000]
+ train/ActionNoiseL2Loss=0.8644
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=138/500000]
+ train/ActionNoiseL2Loss=0.7932
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=139/500000]
+ train/ActionNoiseL2Loss=0.7111
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=140/500000]
+ optim/total_grad_norm=17.31
+ train/ActionNoiseL2Loss=0.9098
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=141/500000]
+ train/ActionNoiseL2Loss=0.6431
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=142/500000]
+ train/ActionNoiseL2Loss=0.7603
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=143/500000]
+ train/ActionNoiseL2Loss=0.8460
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=144/500000]
+ train/ActionNoiseL2Loss=0.7858
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=145/500000]
+ train/ActionNoiseL2Loss=0.8970
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=146/500000]
+ train/ActionNoiseL2Loss=0.7955
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=147/500000]
+ train/ActionNoiseL2Loss=0.6513
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=148/500000]
+ train/ActionNoiseL2Loss=0.6873
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=149/500000]
+ train/ActionNoiseL2Loss=0.6878
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=150/500000]
+ train/ActionNoiseL2Loss=0.7085
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=151/500000]
+ train/ActionNoiseL2Loss=0.7069
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=152/500000]
+ train/ActionNoiseL2Loss=0.7803
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=153/500000]
+ train/ActionNoiseL2Loss=0.6405
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=154/500000]
+ train/ActionNoiseL2Loss=0.7533
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=155/500000]
+ train/ActionNoiseL2Loss=0.7764
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=156/500000]
+ train/ActionNoiseL2Loss=0.6081
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=157/500000]
+ train/ActionNoiseL2Loss=0.8819
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=158/500000]
+ train/ActionNoiseL2Loss=0.5686
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=159/500000]
+ train/ActionNoiseL2Loss=0.6180
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=160/500000]
+ optim/total_grad_norm=11.85
+ train/ActionNoiseL2Loss=0.7053
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=161/500000]
+ train/ActionNoiseL2Loss=0.6708
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=162/500000]
+ train/ActionNoiseL2Loss=0.5856
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=163/500000]
+ train/ActionNoiseL2Loss=0.5904
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=164/500000]
+ train/ActionNoiseL2Loss=0.7964
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=165/500000]
+ train/ActionNoiseL2Loss=0.7435
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=166/500000]
+ train/ActionNoiseL2Loss=0.7593
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=167/500000]
+ train/ActionNoiseL2Loss=0.6268
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=168/500000]
+ train/ActionNoiseL2Loss=0.6713
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=169/500000]
+ train/ActionNoiseL2Loss=0.5795
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=170/500000]
+ train/ActionNoiseL2Loss=0.7079
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=171/500000]
+ train/ActionNoiseL2Loss=0.6530
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=172/500000]
+ train/ActionNoiseL2Loss=0.5171
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=173/500000]
+ train/ActionNoiseL2Loss=0.5461
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=174/500000]
+ train/ActionNoiseL2Loss=0.6566
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=175/500000]
+ train/ActionNoiseL2Loss=0.6948
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=176/500000]
+ train/ActionNoiseL2Loss=0.5512
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=177/500000]
+ train/ActionNoiseL2Loss=0.5432
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=178/500000]
+ train/ActionNoiseL2Loss=0.7932
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=179/500000]
+ train/ActionNoiseL2Loss=0.6048
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=180/500000]
+ optim/total_grad_norm=11.22
+ train/ActionNoiseL2Loss=0.5070
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=181/500000]
+ train/ActionNoiseL2Loss=0.5100
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=182/500000]
+ train/ActionNoiseL2Loss=0.5693
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=183/500000]
+ train/ActionNoiseL2Loss=0.6890
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=184/500000]
+ train/ActionNoiseL2Loss=0.6035
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=185/500000]
+ train/ActionNoiseL2Loss=0.5582
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=186/500000]
+ train/ActionNoiseL2Loss=0.4891
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=187/500000]
+ train/ActionNoiseL2Loss=0.4751
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=188/500000]
+ train/ActionNoiseL2Loss=0.5067
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=189/500000]
+ train/ActionNoiseL2Loss=0.7055
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=190/500000]
+ train/ActionNoiseL2Loss=0.4573
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=191/500000]
+ train/ActionNoiseL2Loss=0.5257
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=192/500000]
+ train/ActionNoiseL2Loss=0.4763
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=193/500000]
+ train/ActionNoiseL2Loss=0.4740
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=194/500000]
+ train/ActionNoiseL2Loss=0.5640
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=195/500000]
+ train/ActionNoiseL2Loss=0.6211
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=196/500000]
+ train/ActionNoiseL2Loss=0.5364
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=197/500000]
+ train/ActionNoiseL2Loss=0.5117
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=198/500000]
+ train/ActionNoiseL2Loss=0.4413
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=199/500000]
+ train/ActionNoiseL2Loss=0.4828
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=200/500000]
+ optim/total_grad_norm=11.75
+ train/ActionNoiseL2Loss=0.4356
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=201/500000]
+ train/ActionNoiseL2Loss=0.4575
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=202/500000]
+ train/ActionNoiseL2Loss=0.6371
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=203/500000]
+ train/ActionNoiseL2Loss=0.4458
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=204/500000]
+ train/ActionNoiseL2Loss=0.5416
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=205/500000]
+ train/ActionNoiseL2Loss=0.4228
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=206/500000]
+ train/ActionNoiseL2Loss=0.5197
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=207/500000]
+ train/ActionNoiseL2Loss=0.6798
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=208/500000]
+ train/ActionNoiseL2Loss=0.4516
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=209/500000]
+ train/ActionNoiseL2Loss=0.4592
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=210/500000]
+ train/ActionNoiseL2Loss=0.4034
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=211/500000]
+ train/ActionNoiseL2Loss=0.6104
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=212/500000]
+ train/ActionNoiseL2Loss=0.4670
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=213/500000]
+ train/ActionNoiseL2Loss=0.4163
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=214/500000]
+ train/ActionNoiseL2Loss=0.3328
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=215/500000]
+ train/ActionNoiseL2Loss=0.4985
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=216/500000]
+ train/ActionNoiseL2Loss=0.5983
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=217/500000]
+ train/ActionNoiseL2Loss=0.4684
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=218/500000]
+ train/ActionNoiseL2Loss=0.4951
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=219/500000]
+ train/ActionNoiseL2Loss=0.4426
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=220/500000]
+ optim/total_grad_norm=13.09
+ train/ActionNoiseL2Loss=0.5668
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=221/500000]
+ train/ActionNoiseL2Loss=0.4278
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=222/500000]
+ train/ActionNoiseL2Loss=0.3641
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=223/500000]
+ train/ActionNoiseL2Loss=0.3579
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=224/500000]
+ train/ActionNoiseL2Loss=0.3929
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=225/500000]
+ train/ActionNoiseL2Loss=0.3892
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=226/500000]
+ train/ActionNoiseL2Loss=0.5716
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=227/500000]
+ train/ActionNoiseL2Loss=0.4569
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=228/500000]
+ train/ActionNoiseL2Loss=0.4471
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=229/500000]
+ train/ActionNoiseL2Loss=0.5860
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=230/500000]
+ train/ActionNoiseL2Loss=0.3782
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=231/500000]
+ train/ActionNoiseL2Loss=0.5182
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=232/500000]
+ train/ActionNoiseL2Loss=0.4356
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=233/500000]
+ train/ActionNoiseL2Loss=0.3935
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=234/500000]
+ train/ActionNoiseL2Loss=0.5163
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=235/500000]
+ train/ActionNoiseL2Loss=0.5726
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=236/500000]
+ train/ActionNoiseL2Loss=0.4442
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=237/500000]
+ train/ActionNoiseL2Loss=0.4738
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=238/500000]
+ train/ActionNoiseL2Loss=0.4137
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=239/500000]
+ train/ActionNoiseL2Loss=0.3336
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=240/500000]
+ optim/total_grad_norm=12.69
+ train/ActionNoiseL2Loss=0.4608
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=241/500000]
+ train/ActionNoiseL2Loss=0.4961
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=242/500000]
+ train/ActionNoiseL2Loss=0.4917
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=243/500000]
+ train/ActionNoiseL2Loss=0.3697
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=244/500000]
+ train/ActionNoiseL2Loss=0.4366
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=245/500000]
+ train/ActionNoiseL2Loss=0.4089
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=246/500000]
+ train/ActionNoiseL2Loss=0.3325
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=247/500000]
+ train/ActionNoiseL2Loss=0.5123
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=248/500000]
+ train/ActionNoiseL2Loss=0.4271
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=249/500000]
+ train/ActionNoiseL2Loss=0.5656
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=250/500000]
+ train/ActionNoiseL2Loss=0.3705
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=251/500000]
+ train/ActionNoiseL2Loss=0.3925
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=252/500000]
+ train/ActionNoiseL2Loss=0.3123
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=253/500000]
+ train/ActionNoiseL2Loss=0.4515
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=254/500000]
+ train/ActionNoiseL2Loss=0.3438
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=255/500000]
+ train/ActionNoiseL2Loss=0.2553
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=256/500000]
+ train/ActionNoiseL2Loss=0.4948
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=257/500000]
+ train/ActionNoiseL2Loss=0.4004
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=258/500000]
+ train/ActionNoiseL2Loss=0.3885
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=259/500000]
+ train/ActionNoiseL2Loss=0.4656
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=260/500000]
+ optim/total_grad_norm=16.23
+ train/ActionNoiseL2Loss=0.4797
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=261/500000]
+ train/ActionNoiseL2Loss=0.3388
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=262/500000]
+ train/ActionNoiseL2Loss=0.3405
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=263/500000]
+ train/ActionNoiseL2Loss=0.3834
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=264/500000]
+ train/ActionNoiseL2Loss=0.3920
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=265/500000]
+ train/ActionNoiseL2Loss=0.4444
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=266/500000]
+ train/ActionNoiseL2Loss=0.3747
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=267/500000]
+ train/ActionNoiseL2Loss=0.3592
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=268/500000]
+ train/ActionNoiseL2Loss=0.3444
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=269/500000]
+ train/ActionNoiseL2Loss=0.4368
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=270/500000]
+ train/ActionNoiseL2Loss=0.4904
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=271/500000]
+ train/ActionNoiseL2Loss=0.5716
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=272/500000]
+ train/ActionNoiseL2Loss=0.3977
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=273/500000]
+ train/ActionNoiseL2Loss=0.4266
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=274/500000]
+ train/ActionNoiseL2Loss=0.4295
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=275/500000]
+ train/ActionNoiseL2Loss=0.3712
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=276/500000]
+ train/ActionNoiseL2Loss=0.3865
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=277/500000]
+ train/ActionNoiseL2Loss=0.4560
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=278/500000]
+ train/ActionNoiseL2Loss=0.4521
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=279/500000]
+ train/ActionNoiseL2Loss=0.4552
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=280/500000]
+ optim/total_grad_norm=13.07
+ train/ActionNoiseL2Loss=0.4681
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=281/500000]
+ train/ActionNoiseL2Loss=0.4110
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=282/500000]
+ train/ActionNoiseL2Loss=0.5004
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=283/500000]
+ train/ActionNoiseL2Loss=0.3981
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=284/500000]
+ train/ActionNoiseL2Loss=0.3851
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=285/500000]
+ train/ActionNoiseL2Loss=0.3053
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=286/500000]
+ train/ActionNoiseL2Loss=0.4473
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=287/500000]
+ train/ActionNoiseL2Loss=0.5383
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=288/500000]
+ train/ActionNoiseL2Loss=0.4718
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=289/500000]
+ train/ActionNoiseL2Loss=0.5555
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=290/500000]
+ train/ActionNoiseL2Loss=0.4510
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=291/500000]
+ train/ActionNoiseL2Loss=0.3876
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=292/500000]
+ train/ActionNoiseL2Loss=0.3142
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=293/500000]
+ train/ActionNoiseL2Loss=0.3511
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=294/500000]
+ train/ActionNoiseL2Loss=0.2661
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=295/500000]
+ train/ActionNoiseL2Loss=0.2540
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=296/500000]
+ train/ActionNoiseL2Loss=0.3017
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=297/500000]
+ train/ActionNoiseL2Loss=0.4130
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=298/500000]
+ train/ActionNoiseL2Loss=0.4127
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=299/500000]
+ train/ActionNoiseL2Loss=0.2996
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=300/500000]
+ optim/total_grad_norm=13.65
+ train/ActionNoiseL2Loss=0.5173
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=301/500000]
+ train/ActionNoiseL2Loss=0.4040
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=302/500000]
+ train/ActionNoiseL2Loss=0.3114
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=303/500000]
+ train/ActionNoiseL2Loss=0.2554
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=304/500000]
+ train/ActionNoiseL2Loss=0.3394
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=305/500000]
+ train/ActionNoiseL2Loss=0.3654
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=306/500000]
+ train/ActionNoiseL2Loss=0.4049
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=307/500000]
+ train/ActionNoiseL2Loss=0.4614
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=308/500000]
+ train/ActionNoiseL2Loss=0.3893
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=309/500000]
+ train/ActionNoiseL2Loss=0.3601
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=310/500000]
+ train/ActionNoiseL2Loss=0.3908
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=311/500000]
+ train/ActionNoiseL2Loss=0.3192
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=312/500000]
+ train/ActionNoiseL2Loss=0.3051
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=313/500000]
+ train/ActionNoiseL2Loss=0.3850
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=314/500000]
+ train/ActionNoiseL2Loss=0.2636
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=315/500000]
+ train/ActionNoiseL2Loss=0.2839
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=316/500000]
+ train/ActionNoiseL2Loss=0.3569
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=317/500000]
+ train/ActionNoiseL2Loss=0.2544
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=318/500000]
+ train/ActionNoiseL2Loss=0.3130
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=319/500000]
+ train/ActionNoiseL2Loss=0.3441
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=320/500000]
+ optim/total_grad_norm=9.259
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=321/500000]
+ train/ActionNoiseL2Loss=0.3717
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=322/500000]
+ train/ActionNoiseL2Loss=0.4892
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=323/500000]
+ train/ActionNoiseL2Loss=0.3744
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=324/500000]
+ train/ActionNoiseL2Loss=0.3255
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=325/500000]
+ train/ActionNoiseL2Loss=0.5037
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=326/500000]
+ train/ActionNoiseL2Loss=0.3345
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=327/500000]
+ train/ActionNoiseL2Loss=0.3774
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=328/500000]
+ train/ActionNoiseL2Loss=0.3567
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=329/500000]
+ train/ActionNoiseL2Loss=0.3371
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=330/500000]
+ train/ActionNoiseL2Loss=0.4519
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=331/500000]
+ train/ActionNoiseL2Loss=0.3184
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=332/500000]
+ train/ActionNoiseL2Loss=0.3081
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=333/500000]
+ train/ActionNoiseL2Loss=0.3123
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=334/500000]
+ train/ActionNoiseL2Loss=0.2981
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=335/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=336/500000]
+ train/ActionNoiseL2Loss=0.2333
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=337/500000]
+ train/ActionNoiseL2Loss=0.4054
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=338/500000]
+ train/ActionNoiseL2Loss=0.5336
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=339/500000]
+ train/ActionNoiseL2Loss=0.5329
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=340/500000]
+ optim/total_grad_norm=8.187
+ train/ActionNoiseL2Loss=0.2210
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=341/500000]
+ train/ActionNoiseL2Loss=0.3905
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=342/500000]
+ train/ActionNoiseL2Loss=0.3963
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=343/500000]
+ train/ActionNoiseL2Loss=0.2869
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=344/500000]
+ train/ActionNoiseL2Loss=0.2081
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=345/500000]
+ train/ActionNoiseL2Loss=0.3726
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=346/500000]
+ train/ActionNoiseL2Loss=0.2696
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=347/500000]
+ train/ActionNoiseL2Loss=0.2602
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=348/500000]
+ train/ActionNoiseL2Loss=0.3309
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=349/500000]
+ train/ActionNoiseL2Loss=0.5278
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=350/500000]
+ train/ActionNoiseL2Loss=0.2919
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=351/500000]
+ train/ActionNoiseL2Loss=0.3379
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=352/500000]
+ train/ActionNoiseL2Loss=0.3761
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=353/500000]
+ train/ActionNoiseL2Loss=0.3491
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=354/500000]
+ train/ActionNoiseL2Loss=0.2486
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=355/500000]
+ train/ActionNoiseL2Loss=0.3874
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=356/500000]
+ train/ActionNoiseL2Loss=0.3978
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=357/500000]
+ train/ActionNoiseL2Loss=0.3930
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=358/500000]
+ train/ActionNoiseL2Loss=0.4914
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=359/500000]
+ train/ActionNoiseL2Loss=0.2693
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=360/500000]
+ optim/total_grad_norm=6.301
+ train/ActionNoiseL2Loss=0.2504
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=361/500000]
+ train/ActionNoiseL2Loss=0.2591
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=362/500000]
+ train/ActionNoiseL2Loss=0.4502
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=363/500000]
+ train/ActionNoiseL2Loss=0.3290
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=364/500000]
+ train/ActionNoiseL2Loss=0.3103
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=365/500000]
+ train/ActionNoiseL2Loss=0.3201
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=366/500000]
+ train/ActionNoiseL2Loss=0.3782
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=367/500000]
+ train/ActionNoiseL2Loss=0.3367
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=368/500000]
+ train/ActionNoiseL2Loss=0.3225
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=369/500000]
+ train/ActionNoiseL2Loss=0.2389
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=370/500000]
+ train/ActionNoiseL2Loss=0.2901
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=371/500000]
+ train/ActionNoiseL2Loss=0.2844
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=372/500000]
+ train/ActionNoiseL2Loss=0.2650
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=373/500000]
+ train/ActionNoiseL2Loss=0.2752
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=374/500000]
+ train/ActionNoiseL2Loss=0.3856
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=375/500000]
+ train/ActionNoiseL2Loss=0.4024
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=376/500000]
+ train/ActionNoiseL2Loss=0.4087
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=377/500000]
+ train/ActionNoiseL2Loss=0.4180
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=378/500000]
+ train/ActionNoiseL2Loss=0.3121
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=379/500000]
+ train/ActionNoiseL2Loss=0.2809
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=380/500000]
+ optim/total_grad_norm=10.50
+ train/ActionNoiseL2Loss=0.2958
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=381/500000]
+ train/ActionNoiseL2Loss=0.2642
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=382/500000]
+ train/ActionNoiseL2Loss=0.2577
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=383/500000]
+ train/ActionNoiseL2Loss=0.5013
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=384/500000]
+ train/ActionNoiseL2Loss=0.3480
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=385/500000]
+ train/ActionNoiseL2Loss=0.2947
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=386/500000]
+ train/ActionNoiseL2Loss=0.3648
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=387/500000]
+ train/ActionNoiseL2Loss=0.2587
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=388/500000]
+ train/ActionNoiseL2Loss=0.2441
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=389/500000]
+ train/ActionNoiseL2Loss=0.2421
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=390/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=391/500000]
+ train/ActionNoiseL2Loss=0.3875
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=392/500000]
+ train/ActionNoiseL2Loss=0.3027
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=393/500000]
+ train/ActionNoiseL2Loss=0.2969
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=394/500000]
+ train/ActionNoiseL2Loss=0.3868
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=395/500000]
+ train/ActionNoiseL2Loss=0.3646
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=396/500000]
+ train/ActionNoiseL2Loss=0.2624
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=397/500000]
+ train/ActionNoiseL2Loss=0.3863
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=398/500000]
+ train/ActionNoiseL2Loss=0.2542
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=399/500000]
+ train/ActionNoiseL2Loss=0.3139
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=400/500000]
+ optim/total_grad_norm=7.841
+ train/ActionNoiseL2Loss=0.2739
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=401/500000]
+ train/ActionNoiseL2Loss=0.2423
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=402/500000]
+ train/ActionNoiseL2Loss=0.2580
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=403/500000]
+ train/ActionNoiseL2Loss=0.2315
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=404/500000]
+ train/ActionNoiseL2Loss=0.3276
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=405/500000]
+ train/ActionNoiseL2Loss=0.2080
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=406/500000]
+ train/ActionNoiseL2Loss=0.2571
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=407/500000]
+ train/ActionNoiseL2Loss=0.3259
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=408/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=409/500000]
+ train/ActionNoiseL2Loss=0.3831
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=410/500000]
+ train/ActionNoiseL2Loss=0.3609
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=411/500000]
+ train/ActionNoiseL2Loss=0.2860
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=412/500000]
+ train/ActionNoiseL2Loss=0.3700
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=413/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=414/500000]
+ train/ActionNoiseL2Loss=0.2850
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=415/500000]
+ train/ActionNoiseL2Loss=0.2960
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=416/500000]
+ train/ActionNoiseL2Loss=0.3845
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=417/500000]
+ train/ActionNoiseL2Loss=0.2874
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=418/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=419/500000]
+ train/ActionNoiseL2Loss=0.4047
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=420/500000]
+ optim/total_grad_norm=11.53
+ train/ActionNoiseL2Loss=0.4161
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=421/500000]
+ train/ActionNoiseL2Loss=0.3622
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=422/500000]
+ train/ActionNoiseL2Loss=0.2527
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=423/500000]
+ train/ActionNoiseL2Loss=0.2852
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=424/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=425/500000]
+ train/ActionNoiseL2Loss=0.3251
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=426/500000]
+ train/ActionNoiseL2Loss=0.3073
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=427/500000]
+ train/ActionNoiseL2Loss=0.2770
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=428/500000]
+ train/ActionNoiseL2Loss=0.2996
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=429/500000]
+ train/ActionNoiseL2Loss=0.3403
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=430/500000]
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=431/500000]
+ train/ActionNoiseL2Loss=0.2364
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=432/500000]
+ train/ActionNoiseL2Loss=0.3104
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=433/500000]
+ train/ActionNoiseL2Loss=0.2967
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=434/500000]
+ train/ActionNoiseL2Loss=0.2113
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=435/500000]
+ train/ActionNoiseL2Loss=0.2681
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=436/500000]
+ train/ActionNoiseL2Loss=0.2964
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=437/500000]
+ train/ActionNoiseL2Loss=0.4102
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=438/500000]
+ train/ActionNoiseL2Loss=0.2661
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=439/500000]
+ train/ActionNoiseL2Loss=0.2650
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=440/500000]
+ optim/total_grad_norm=8.932
+ train/ActionNoiseL2Loss=0.2933
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=441/500000]
+ train/ActionNoiseL2Loss=0.2863
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=442/500000]
+ train/ActionNoiseL2Loss=0.3061
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=443/500000]
+ train/ActionNoiseL2Loss=0.3584
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=444/500000]
+ train/ActionNoiseL2Loss=0.3150
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=445/500000]
+ train/ActionNoiseL2Loss=0.3488
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=446/500000]
+ train/ActionNoiseL2Loss=0.2728
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=447/500000]
+ train/ActionNoiseL2Loss=0.3229
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=448/500000]
+ train/ActionNoiseL2Loss=0.3392
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=449/500000]
+ train/ActionNoiseL2Loss=0.2778
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=450/500000]
+ train/ActionNoiseL2Loss=0.2838
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=451/500000]
+ train/ActionNoiseL2Loss=0.3352
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=452/500000]
+ train/ActionNoiseL2Loss=0.3046
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=453/500000]
+ train/ActionNoiseL2Loss=0.3866
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=454/500000]
+ train/ActionNoiseL2Loss=0.2856
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=455/500000]
+ train/ActionNoiseL2Loss=0.3923
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=456/500000]
+ train/ActionNoiseL2Loss=0.4017
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=457/500000]
+ train/ActionNoiseL2Loss=0.2861
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=458/500000]
+ train/ActionNoiseL2Loss=0.3301
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=459/500000]
+ train/ActionNoiseL2Loss=0.1926
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=460/500000]
+ optim/total_grad_norm=10.07
+ train/ActionNoiseL2Loss=0.3836
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=461/500000]
+ train/ActionNoiseL2Loss=0.3428
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=462/500000]
+ train/ActionNoiseL2Loss=0.3275
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=463/500000]
+ train/ActionNoiseL2Loss=0.2877
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=464/500000]
+ train/ActionNoiseL2Loss=0.3204
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=465/500000]
+ train/ActionNoiseL2Loss=0.2209
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=466/500000]
+ train/ActionNoiseL2Loss=0.2192
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=467/500000]
+ train/ActionNoiseL2Loss=0.2571
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=468/500000]
+ train/ActionNoiseL2Loss=0.3978
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=469/500000]
+ train/ActionNoiseL2Loss=0.2530
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=470/500000]
+ train/ActionNoiseL2Loss=0.3173
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=471/500000]
+ train/ActionNoiseL2Loss=0.2203
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=472/500000]
+ train/ActionNoiseL2Loss=0.2513
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=473/500000]
+ train/ActionNoiseL2Loss=0.3132
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=474/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=475/500000]
+ train/ActionNoiseL2Loss=0.2248
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=476/500000]
+ train/ActionNoiseL2Loss=0.3063
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=477/500000]
+ train/ActionNoiseL2Loss=0.2842
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=478/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=479/500000]
+ train/ActionNoiseL2Loss=0.3143
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=480/500000]
+ optim/total_grad_norm=7.446
+ train/ActionNoiseL2Loss=0.2562
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=481/500000]
+ train/ActionNoiseL2Loss=0.3228
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=482/500000]
+ train/ActionNoiseL2Loss=0.2439
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=483/500000]
+ train/ActionNoiseL2Loss=0.3545
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=484/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=485/500000]
+ train/ActionNoiseL2Loss=0.2719
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=486/500000]
+ train/ActionNoiseL2Loss=0.2380
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=487/500000]
+ train/ActionNoiseL2Loss=0.2509
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=488/500000]
+ train/ActionNoiseL2Loss=0.2634
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=489/500000]
+ train/ActionNoiseL2Loss=0.2827
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=490/500000]
+ train/ActionNoiseL2Loss=0.2570
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+[step=491/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=492/500000]
+ train/ActionNoiseL2Loss=0.3273
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=493/500000]
+ train/ActionNoiseL2Loss=0.2641
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=494/500000]
+ train/ActionNoiseL2Loss=0.2728
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=495/500000]
+ train/ActionNoiseL2Loss=0.3022
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=496/500000]
+ train/ActionNoiseL2Loss=0.3136
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=497/500000]
+ train/ActionNoiseL2Loss=0.2375
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=498/500000]
+ train/ActionNoiseL2Loss=0.3089
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=499/500000]
+ train/ActionNoiseL2Loss=0.2655
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=500/500000]
+ optim/total_grad_norm=9.060
+ train/ActionNoiseL2Loss=0.2388
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,466
+10/02 [19:39:51] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+10/02 [19:39:53] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+10/02 [19:39:57] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+10/02 [19:40:23] INFO | >> Saving config... checkpoint.py:608
+10/02 [19:41:02] INFO | >> Saving model state... checkpoint.py:796
+10/02 [19:42:16] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [19:43:49] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionNoiseL2Loss=0.3328
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=502/500000]
+ train/ActionNoiseL2Loss=0.2553
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=503/500000]
+ train/ActionNoiseL2Loss=0.3348
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=504/500000]
+ train/ActionNoiseL2Loss=0.4767
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=505/500000]
+ train/ActionNoiseL2Loss=0.3529
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=506/500000]
+ train/ActionNoiseL2Loss=0.2405
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=507/500000]
+ train/ActionNoiseL2Loss=0.2319
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=508/500000]
+ train/ActionNoiseL2Loss=0.2796
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=509/500000]
+ train/ActionNoiseL2Loss=0.3362
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=510/500000]
+ train/ActionNoiseL2Loss=0.2681
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=511/500000]
+ train/ActionNoiseL2Loss=0.2917
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=512/500000]
+ train/ActionNoiseL2Loss=0.3305
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=513/500000]
+ train/ActionNoiseL2Loss=0.2778
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=514/500000]
+ train/ActionNoiseL2Loss=0.2682
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=515/500000]
+ train/ActionNoiseL2Loss=0.2838
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=516/500000]
+ train/ActionNoiseL2Loss=0.2553
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=517/500000]
+ train/ActionNoiseL2Loss=0.2073
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=518/500000]
+ train/ActionNoiseL2Loss=0.2588
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=519/500000]
+ train/ActionNoiseL2Loss=0.5064
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=520/500000]
+ optim/total_grad_norm=8.741
+ train/ActionNoiseL2Loss=0.2557
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=521/500000]
+ train/ActionNoiseL2Loss=0.2699
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=522/500000]
+ train/ActionNoiseL2Loss=0.1823
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=523/500000]
+ train/ActionNoiseL2Loss=0.2570
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=524/500000]
+ train/ActionNoiseL2Loss=0.3633
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=525/500000]
+ train/ActionNoiseL2Loss=0.3860
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=526/500000]
+ train/ActionNoiseL2Loss=0.2334
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=527/500000]
+ train/ActionNoiseL2Loss=0.3603
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=528/500000]
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=529/500000]
+ train/ActionNoiseL2Loss=0.2415
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=530/500000]
+ train/ActionNoiseL2Loss=0.4407
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=531/500000]
+ train/ActionNoiseL2Loss=0.2209
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=532/500000]
+ train/ActionNoiseL2Loss=0.3580
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=533/500000]
+ train/ActionNoiseL2Loss=0.5081
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=534/500000]
+ train/ActionNoiseL2Loss=0.3284
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=535/500000]
+ train/ActionNoiseL2Loss=0.4212
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=536/500000]
+ train/ActionNoiseL2Loss=0.3300
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=537/500000]
+ train/ActionNoiseL2Loss=0.5227
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=538/500000]
+ train/ActionNoiseL2Loss=0.3758
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=539/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=540/500000]
+ optim/total_grad_norm=7.873
+ train/ActionNoiseL2Loss=0.2272
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=541/500000]
+ train/ActionNoiseL2Loss=0.2330
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=542/500000]
+ train/ActionNoiseL2Loss=0.2415
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=543/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=544/500000]
+ train/ActionNoiseL2Loss=0.2712
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=545/500000]
+ train/ActionNoiseL2Loss=0.2959
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=546/500000]
+ train/ActionNoiseL2Loss=0.2407
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=547/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=548/500000]
+ train/ActionNoiseL2Loss=0.2988
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=549/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=550/500000]
+ train/ActionNoiseL2Loss=0.3236
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=551/500000]
+ train/ActionNoiseL2Loss=0.2795
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=552/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=553/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=554/500000]
+ train/ActionNoiseL2Loss=0.2836
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=555/500000]
+ train/ActionNoiseL2Loss=0.3709
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=556/500000]
+ train/ActionNoiseL2Loss=0.2055
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=557/500000]
+ train/ActionNoiseL2Loss=0.2787
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=558/500000]
+ train/ActionNoiseL2Loss=0.3750
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=559/500000]
+ train/ActionNoiseL2Loss=0.3164
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=560/500000]
+ optim/total_grad_norm=6.841
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=561/500000]
+ train/ActionNoiseL2Loss=0.3386
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=562/500000]
+ train/ActionNoiseL2Loss=0.2199
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=563/500000]
+ train/ActionNoiseL2Loss=0.2957
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=564/500000]
+ train/ActionNoiseL2Loss=0.3464
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=565/500000]
+ train/ActionNoiseL2Loss=0.2552
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=566/500000]
+ train/ActionNoiseL2Loss=0.1931
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=567/500000]
+ train/ActionNoiseL2Loss=0.2356
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=568/500000]
+ train/ActionNoiseL2Loss=0.3947
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=569/500000]
+ train/ActionNoiseL2Loss=0.1702
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=570/500000]
+ train/ActionNoiseL2Loss=0.2379
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=571/500000]
+ train/ActionNoiseL2Loss=0.2396
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=572/500000]
+ train/ActionNoiseL2Loss=0.1823
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=573/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=574/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=575/500000]
+ train/ActionNoiseL2Loss=0.2488
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=576/500000]
+ train/ActionNoiseL2Loss=0.2515
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=577/500000]
+ train/ActionNoiseL2Loss=0.2474
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=578/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=579/500000]
+ train/ActionNoiseL2Loss=0.3190
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=580/500000]
+ optim/total_grad_norm=8.227
+ train/ActionNoiseL2Loss=0.3296
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=581/500000]
+ train/ActionNoiseL2Loss=0.4610
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=582/500000]
+ train/ActionNoiseL2Loss=0.2232
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=583/500000]
+ train/ActionNoiseL2Loss=0.2476
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=584/500000]
+ train/ActionNoiseL2Loss=0.3111
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=585/500000]
+ train/ActionNoiseL2Loss=0.2349
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=586/500000]
+ train/ActionNoiseL2Loss=0.2729
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=587/500000]
+ train/ActionNoiseL2Loss=0.2935
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=588/500000]
+ train/ActionNoiseL2Loss=0.3345
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=589/500000]
+ train/ActionNoiseL2Loss=0.4098
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=590/500000]
+ train/ActionNoiseL2Loss=0.3950
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=591/500000]
+ train/ActionNoiseL2Loss=0.2369
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=592/500000]
+ train/ActionNoiseL2Loss=0.3249
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=593/500000]
+ train/ActionNoiseL2Loss=0.3884
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=594/500000]
+ train/ActionNoiseL2Loss=0.3567
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=595/500000]
+ train/ActionNoiseL2Loss=0.4159
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=596/500000]
+ train/ActionNoiseL2Loss=0.2336
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=597/500000]
+ train/ActionNoiseL2Loss=0.3265
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=598/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=599/500000]
+ train/ActionNoiseL2Loss=0.3240
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=600/500000]
+ optim/total_grad_norm=7.758
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=601/500000]
+ train/ActionNoiseL2Loss=0.3631
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=602/500000]
+ train/ActionNoiseL2Loss=0.3025
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=603/500000]
+ train/ActionNoiseL2Loss=0.2049
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=604/500000]
+ train/ActionNoiseL2Loss=0.2867
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=605/500000]
+ train/ActionNoiseL2Loss=0.2510
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=606/500000]
+ train/ActionNoiseL2Loss=0.3164
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=607/500000]
+ train/ActionNoiseL2Loss=0.2680
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=608/500000]
+ train/ActionNoiseL2Loss=0.2115
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=609/500000]
+ train/ActionNoiseL2Loss=0.2995
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=610/500000]
+ train/ActionNoiseL2Loss=0.2566
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=611/500000]
+ train/ActionNoiseL2Loss=0.2267
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=612/500000]
+ train/ActionNoiseL2Loss=0.4176
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=613/500000]
+ train/ActionNoiseL2Loss=0.1902
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=614/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=615/500000]
+ train/ActionNoiseL2Loss=0.2551
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=616/500000]
+ train/ActionNoiseL2Loss=0.3635
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=617/500000]
+ train/ActionNoiseL2Loss=0.2558
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=618/500000]
+ train/ActionNoiseL2Loss=0.2373
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=619/500000]
+ train/ActionNoiseL2Loss=0.3431
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=620/500000]
+ optim/total_grad_norm=6.040
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=621/500000]
+ train/ActionNoiseL2Loss=0.2705
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=622/500000]
+ train/ActionNoiseL2Loss=0.3810
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=623/500000]
+ train/ActionNoiseL2Loss=0.2869
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=624/500000]
+ train/ActionNoiseL2Loss=0.2977
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=625/500000]
+ train/ActionNoiseL2Loss=0.2803
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=626/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=627/500000]
+ train/ActionNoiseL2Loss=0.2267
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=628/500000]
+ train/ActionNoiseL2Loss=0.4299
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=629/500000]
+ train/ActionNoiseL2Loss=0.3360
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=630/500000]
+ train/ActionNoiseL2Loss=0.3646
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=631/500000]
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=632/500000]
+ train/ActionNoiseL2Loss=0.3859
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=633/500000]
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=634/500000]
+ train/ActionNoiseL2Loss=0.2438
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=635/500000]
+ train/ActionNoiseL2Loss=0.2405
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=636/500000]
+ train/ActionNoiseL2Loss=0.3503
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=637/500000]
+ train/ActionNoiseL2Loss=0.2062
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=638/500000]
+ train/ActionNoiseL2Loss=0.3186
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=639/500000]
+ train/ActionNoiseL2Loss=0.2072
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=640/500000]
+ optim/total_grad_norm=6.977
+ train/ActionNoiseL2Loss=0.2242
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=641/500000]
+ train/ActionNoiseL2Loss=0.3083
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=642/500000]
+ train/ActionNoiseL2Loss=0.2830
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=643/500000]
+ train/ActionNoiseL2Loss=0.2027
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=644/500000]
+ train/ActionNoiseL2Loss=0.3055
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=645/500000]
+ train/ActionNoiseL2Loss=0.2608
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=646/500000]
+ train/ActionNoiseL2Loss=0.2430
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=647/500000]
+ train/ActionNoiseL2Loss=0.2181
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=648/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=649/500000]
+ train/ActionNoiseL2Loss=0.2714
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=650/500000]
+ train/ActionNoiseL2Loss=0.2614
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=651/500000]
+ train/ActionNoiseL2Loss=0.1871
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=652/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=653/500000]
+ train/ActionNoiseL2Loss=0.1805
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=654/500000]
+ train/ActionNoiseL2Loss=0.2524
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=655/500000]
+ train/ActionNoiseL2Loss=0.2590
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=656/500000]
+ train/ActionNoiseL2Loss=0.2232
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=657/500000]
+ train/ActionNoiseL2Loss=0.2053
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=658/500000]
+ train/ActionNoiseL2Loss=0.2616
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=659/500000]
+ train/ActionNoiseL2Loss=0.2101
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=660/500000]
+ optim/total_grad_norm=7.312
+ train/ActionNoiseL2Loss=0.3093
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=661/500000]
+ train/ActionNoiseL2Loss=0.3176
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=662/500000]
+ train/ActionNoiseL2Loss=0.3066
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=663/500000]
+ train/ActionNoiseL2Loss=0.3001
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=664/500000]
+ train/ActionNoiseL2Loss=0.4075
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=665/500000]
+ train/ActionNoiseL2Loss=0.3480
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=666/500000]
+ train/ActionNoiseL2Loss=0.2537
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=667/500000]
+ train/ActionNoiseL2Loss=0.3933
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=668/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=669/500000]
+ train/ActionNoiseL2Loss=0.2523
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=670/500000]
+ train/ActionNoiseL2Loss=0.3395
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=671/500000]
+ train/ActionNoiseL2Loss=0.2119
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=672/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=673/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=674/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=675/500000]
+ train/ActionNoiseL2Loss=0.2995
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=676/500000]
+ train/ActionNoiseL2Loss=0.2947
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=677/500000]
+ train/ActionNoiseL2Loss=0.1982
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=678/500000]
+ train/ActionNoiseL2Loss=0.1820
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=679/500000]
+ train/ActionNoiseL2Loss=0.2382
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=680/500000]
+ optim/total_grad_norm=9.073
+ train/ActionNoiseL2Loss=0.3660
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=681/500000]
+ train/ActionNoiseL2Loss=0.3286
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=682/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=683/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=684/500000]
+ train/ActionNoiseL2Loss=0.4011
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=685/500000]
+ train/ActionNoiseL2Loss=0.2644
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=686/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=687/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=688/500000]
+ train/ActionNoiseL2Loss=0.2681
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=689/500000]
+ train/ActionNoiseL2Loss=0.2431
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=690/500000]
+ train/ActionNoiseL2Loss=0.3193
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=691/500000]
+ train/ActionNoiseL2Loss=0.2109
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=692/500000]
+ train/ActionNoiseL2Loss=0.3125
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=693/500000]
+ train/ActionNoiseL2Loss=0.3170
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=694/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=695/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=696/500000]
+ train/ActionNoiseL2Loss=0.4244
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=697/500000]
+ train/ActionNoiseL2Loss=0.2434
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=698/500000]
+ train/ActionNoiseL2Loss=0.2497
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=699/500000]
+ train/ActionNoiseL2Loss=0.2806
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=700/500000]
+ optim/total_grad_norm=7.796
+ train/ActionNoiseL2Loss=0.3091
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=701/500000]
+ train/ActionNoiseL2Loss=0.1904
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=702/500000]
+ train/ActionNoiseL2Loss=0.3239
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=703/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=704/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=705/500000]
+ train/ActionNoiseL2Loss=0.2722
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=706/500000]
+ train/ActionNoiseL2Loss=0.2387
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=707/500000]
+ train/ActionNoiseL2Loss=0.2847
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=708/500000]
+ train/ActionNoiseL2Loss=0.2292
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=709/500000]
+ train/ActionNoiseL2Loss=0.3023
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=710/500000]
+ train/ActionNoiseL2Loss=0.3217
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=711/500000]
+ train/ActionNoiseL2Loss=0.2311
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=712/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=713/500000]
+ train/ActionNoiseL2Loss=0.2847
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=714/500000]
+ train/ActionNoiseL2Loss=0.2626
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=715/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=716/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=717/500000]
+ train/ActionNoiseL2Loss=0.2520
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=718/500000]
+ train/ActionNoiseL2Loss=0.3474
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=719/500000]
+ train/ActionNoiseL2Loss=0.1905
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=720/500000]
+ optim/total_grad_norm=7.241
+ train/ActionNoiseL2Loss=0.2675
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=721/500000]
+ train/ActionNoiseL2Loss=0.2477
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=722/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=723/500000]
+ train/ActionNoiseL2Loss=0.3515
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=724/500000]
+ train/ActionNoiseL2Loss=0.2337
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=725/500000]
+ train/ActionNoiseL2Loss=0.2226
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=726/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=727/500000]
+ train/ActionNoiseL2Loss=0.2528
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=728/500000]
+ train/ActionNoiseL2Loss=0.2374
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=729/500000]
+ train/ActionNoiseL2Loss=0.2333
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=730/500000]
+ train/ActionNoiseL2Loss=0.2145
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=731/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=732/500000]
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=733/500000]
+ train/ActionNoiseL2Loss=0.2338
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=734/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=735/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=736/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=737/500000]
+ train/ActionNoiseL2Loss=0.1950
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=738/500000]
+ train/ActionNoiseL2Loss=0.2098
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=739/500000]
+ train/ActionNoiseL2Loss=0.3021
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=740/500000]
+ optim/total_grad_norm=6.854
+ train/ActionNoiseL2Loss=0.2588
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=741/500000]
+ train/ActionNoiseL2Loss=0.3000
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=742/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=743/500000]
+ train/ActionNoiseL2Loss=0.2239
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=744/500000]
+ train/ActionNoiseL2Loss=0.2490
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=745/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=746/500000]
+ train/ActionNoiseL2Loss=0.2088
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=747/500000]
+ train/ActionNoiseL2Loss=0.2499
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=748/500000]
+ train/ActionNoiseL2Loss=0.2483
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=749/500000]
+ train/ActionNoiseL2Loss=0.2081
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=750/500000]
+ train/ActionNoiseL2Loss=0.2246
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=751/500000]
+ train/ActionNoiseL2Loss=0.2537
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=752/500000]
+ train/ActionNoiseL2Loss=0.2755
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=753/500000]
+ train/ActionNoiseL2Loss=0.2425
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=754/500000]
+ train/ActionNoiseL2Loss=0.2037
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=755/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=756/500000]
+ train/ActionNoiseL2Loss=0.2561
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=757/500000]
+ train/ActionNoiseL2Loss=0.2416
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=758/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=759/500000]
+ train/ActionNoiseL2Loss=0.2509
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=760/500000]
+ optim/total_grad_norm=10.62
+ train/ActionNoiseL2Loss=0.4663
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=761/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=762/500000]
+ train/ActionNoiseL2Loss=0.4277
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=763/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=764/500000]
+ train/ActionNoiseL2Loss=0.3103
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=765/500000]
+ train/ActionNoiseL2Loss=0.3204
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=766/500000]
+ train/ActionNoiseL2Loss=0.3175
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=767/500000]
+ train/ActionNoiseL2Loss=0.1904
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=768/500000]
+ train/ActionNoiseL2Loss=0.2275
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=769/500000]
+ train/ActionNoiseL2Loss=0.2639
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=770/500000]
+ train/ActionNoiseL2Loss=0.2724
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=771/500000]
+ train/ActionNoiseL2Loss=0.2668
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=772/500000]
+ train/ActionNoiseL2Loss=0.2065
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=773/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=774/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=775/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=776/500000]
+ train/ActionNoiseL2Loss=0.3240
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=777/500000]
+ train/ActionNoiseL2Loss=0.2553
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=778/500000]
+ train/ActionNoiseL2Loss=0.2841
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=779/500000]
+ train/ActionNoiseL2Loss=0.3982
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=780/500000]
+ optim/total_grad_norm=6.680
+ train/ActionNoiseL2Loss=0.2971
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=781/500000]
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=782/500000]
+ train/ActionNoiseL2Loss=0.2933
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=783/500000]
+ train/ActionNoiseL2Loss=0.2698
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=784/500000]
+ train/ActionNoiseL2Loss=0.2986
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=785/500000]
+ train/ActionNoiseL2Loss=0.1505
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=786/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=787/500000]
+ train/ActionNoiseL2Loss=0.2880
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=788/500000]
+ train/ActionNoiseL2Loss=0.2158
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=789/500000]
+ train/ActionNoiseL2Loss=0.2811
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=790/500000]
+ train/ActionNoiseL2Loss=0.2626
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=791/500000]
+ train/ActionNoiseL2Loss=0.3922
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=792/500000]
+ train/ActionNoiseL2Loss=0.2556
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=793/500000]
+ train/ActionNoiseL2Loss=0.1846
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=794/500000]
+ train/ActionNoiseL2Loss=0.2666
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=795/500000]
+ train/ActionNoiseL2Loss=0.2567
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=796/500000]
+ train/ActionNoiseL2Loss=0.3170
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=797/500000]
+ train/ActionNoiseL2Loss=0.2299
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=798/500000]
+ train/ActionNoiseL2Loss=0.2778
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=799/500000]
+ train/ActionNoiseL2Loss=0.3602
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=800/500000]
+ optim/total_grad_norm=5.021
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=801/500000]
+ train/ActionNoiseL2Loss=0.2392
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=802/500000]
+ train/ActionNoiseL2Loss=0.2512
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=803/500000]
+ train/ActionNoiseL2Loss=0.2596
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=804/500000]
+ train/ActionNoiseL2Loss=0.2667
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=805/500000]
+ train/ActionNoiseL2Loss=0.1994
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=806/500000]
+ train/ActionNoiseL2Loss=0.2548
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=807/500000]
+ train/ActionNoiseL2Loss=0.2806
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=808/500000]
+ train/ActionNoiseL2Loss=0.2260
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=809/500000]
+ train/ActionNoiseL2Loss=0.2304
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=810/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=811/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=812/500000]
+ train/ActionNoiseL2Loss=0.3460
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=813/500000]
+ train/ActionNoiseL2Loss=0.2398
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=814/500000]
+ train/ActionNoiseL2Loss=0.1733
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=815/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=816/500000]
+ train/ActionNoiseL2Loss=0.3066
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=817/500000]
+ train/ActionNoiseL2Loss=0.2627
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=818/500000]
+ train/ActionNoiseL2Loss=0.2863
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=819/500000]
+ train/ActionNoiseL2Loss=0.2074
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=820/500000]
+ optim/total_grad_norm=8.369
+ train/ActionNoiseL2Loss=0.2595
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=821/500000]
+ train/ActionNoiseL2Loss=0.3279
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=822/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=823/500000]
+ train/ActionNoiseL2Loss=0.3072
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=824/500000]
+ train/ActionNoiseL2Loss=0.2829
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=825/500000]
+ train/ActionNoiseL2Loss=0.2810
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=826/500000]
+ train/ActionNoiseL2Loss=0.2791
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=827/500000]
+ train/ActionNoiseL2Loss=0.3056
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=828/500000]
+ train/ActionNoiseL2Loss=0.2029
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=829/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=830/500000]
+ train/ActionNoiseL2Loss=0.1967
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=831/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=832/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=833/500000]
+ train/ActionNoiseL2Loss=0.2537
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=834/500000]
+ train/ActionNoiseL2Loss=0.2977
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=835/500000]
+ train/ActionNoiseL2Loss=0.2150
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=836/500000]
+ train/ActionNoiseL2Loss=0.1740
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=837/500000]
+ train/ActionNoiseL2Loss=0.2421
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=838/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=839/500000]
+ train/ActionNoiseL2Loss=0.2562
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=840/500000]
+ optim/total_grad_norm=4.869
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=841/500000]
+ train/ActionNoiseL2Loss=0.3580
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=842/500000]
+ train/ActionNoiseL2Loss=0.2154
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=843/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=844/500000]
+ train/ActionNoiseL2Loss=0.2108
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=845/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=846/500000]
+ train/ActionNoiseL2Loss=0.2407
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=847/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=848/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=849/500000]
+ train/ActionNoiseL2Loss=0.2533
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=850/500000]
+ train/ActionNoiseL2Loss=0.2010
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=851/500000]
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=852/500000]
+ train/ActionNoiseL2Loss=0.2262
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=853/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=854/500000]
+ train/ActionNoiseL2Loss=0.2898
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=855/500000]
+ train/ActionNoiseL2Loss=0.4144
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=856/500000]
+ train/ActionNoiseL2Loss=0.3097
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=857/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=858/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=859/500000]
+ train/ActionNoiseL2Loss=0.4043
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=860/500000]
+ optim/total_grad_norm=8.877
+ train/ActionNoiseL2Loss=0.3019
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=861/500000]
+ train/ActionNoiseL2Loss=0.3810
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=862/500000]
+ train/ActionNoiseL2Loss=0.2101
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=863/500000]
+ train/ActionNoiseL2Loss=0.3485
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=864/500000]
+ train/ActionNoiseL2Loss=0.2889
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=865/500000]
+ train/ActionNoiseL2Loss=0.3084
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=866/500000]
+ train/ActionNoiseL2Loss=0.4669
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=867/500000]
+ train/ActionNoiseL2Loss=0.2945
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=868/500000]
+ train/ActionNoiseL2Loss=0.2559
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=869/500000]
+ train/ActionNoiseL2Loss=0.1591
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=870/500000]
+ train/ActionNoiseL2Loss=0.2450
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=871/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=872/500000]
+ train/ActionNoiseL2Loss=0.3345
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=873/500000]
+ train/ActionNoiseL2Loss=0.1988
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=874/500000]
+ train/ActionNoiseL2Loss=0.1863
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=875/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=876/500000]
+ train/ActionNoiseL2Loss=0.1849
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=877/500000]
+ train/ActionNoiseL2Loss=0.3026
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=878/500000]
+ train/ActionNoiseL2Loss=0.2251
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=879/500000]
+ train/ActionNoiseL2Loss=0.2005
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=880/500000]
+ optim/total_grad_norm=6.282
+ train/ActionNoiseL2Loss=0.2383
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=881/500000]
+ train/ActionNoiseL2Loss=0.2320
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=882/500000]
+ train/ActionNoiseL2Loss=0.2604
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=883/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=884/500000]
+ train/ActionNoiseL2Loss=0.1937
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=885/500000]
+ train/ActionNoiseL2Loss=0.1879
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=886/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=887/500000]
+ train/ActionNoiseL2Loss=0.2045
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=888/500000]
+ train/ActionNoiseL2Loss=0.3338
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=889/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=890/500000]
+ train/ActionNoiseL2Loss=0.2249
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=891/500000]
+ train/ActionNoiseL2Loss=0.2751
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=892/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=893/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=894/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=895/500000]
+ train/ActionNoiseL2Loss=0.2520
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=896/500000]
+ train/ActionNoiseL2Loss=0.1908
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=897/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=898/500000]
+ train/ActionNoiseL2Loss=0.1633
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=899/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=900/500000]
+ optim/total_grad_norm=4.234
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=901/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=902/500000]
+ train/ActionNoiseL2Loss=0.2639
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=903/500000]
+ train/ActionNoiseL2Loss=0.1656
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=904/500000]
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=905/500000]
+ train/ActionNoiseL2Loss=0.1946
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=906/500000]
+ train/ActionNoiseL2Loss=0.2344
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=907/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=908/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=909/500000]
+ train/ActionNoiseL2Loss=0.2320
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=910/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=911/500000]
+ train/ActionNoiseL2Loss=0.1668
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=912/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=913/500000]
+ train/ActionNoiseL2Loss=0.2558
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=914/500000]
+ train/ActionNoiseL2Loss=0.2788
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=915/500000]
+ train/ActionNoiseL2Loss=0.2937
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=916/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=917/500000]
+ train/ActionNoiseL2Loss=0.2560
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=918/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=919/500000]
+ train/ActionNoiseL2Loss=0.2139
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=920/500000]
+ optim/total_grad_norm=4.964
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=921/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=922/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=923/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=924/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=925/500000]
+ train/ActionNoiseL2Loss=0.1971
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=926/500000]
+ train/ActionNoiseL2Loss=0.2542
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=927/500000]
+ train/ActionNoiseL2Loss=0.2288
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=928/500000]
+ train/ActionNoiseL2Loss=0.1942
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=929/500000]
+ train/ActionNoiseL2Loss=0.2795
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=930/500000]
+ train/ActionNoiseL2Loss=0.2466
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=931/500000]
+ train/ActionNoiseL2Loss=0.3076
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=932/500000]
+ train/ActionNoiseL2Loss=0.2064
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=933/500000]
+ train/ActionNoiseL2Loss=0.3169
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=934/500000]
+ train/ActionNoiseL2Loss=0.2746
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=935/500000]
+ train/ActionNoiseL2Loss=0.2420
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=936/500000]
+ train/ActionNoiseL2Loss=0.2821
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=937/500000]
+ train/ActionNoiseL2Loss=0.1841
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=938/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=939/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=940/500000]
+ optim/total_grad_norm=4.169
+ train/ActionNoiseL2Loss=0.1885
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=941/500000]
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=942/500000]
+ train/ActionNoiseL2Loss=0.3963
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=943/500000]
+ train/ActionNoiseL2Loss=0.1795
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=944/500000]
+ train/ActionNoiseL2Loss=0.2065
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=945/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=946/500000]
+ train/ActionNoiseL2Loss=0.2292
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=947/500000]
+ train/ActionNoiseL2Loss=0.2152
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=948/500000]
+ train/ActionNoiseL2Loss=0.2574
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=949/500000]
+ train/ActionNoiseL2Loss=0.1957
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=950/500000]
+ train/ActionNoiseL2Loss=0.2222
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=951/500000]
+ train/ActionNoiseL2Loss=0.1995
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=952/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=953/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=954/500000]
+ train/ActionNoiseL2Loss=0.2336
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=955/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=956/500000]
+ train/ActionNoiseL2Loss=0.3194
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=957/500000]
+ train/ActionNoiseL2Loss=0.2560
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=958/500000]
+ train/ActionNoiseL2Loss=0.3260
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=959/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=960/500000]
+ optim/total_grad_norm=5.015
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=961/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=962/500000]
+ train/ActionNoiseL2Loss=0.1937
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=963/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=964/500000]
+ train/ActionNoiseL2Loss=0.2257
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=965/500000]
+ train/ActionNoiseL2Loss=0.2287
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=966/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=967/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=968/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=969/500000]
+ train/ActionNoiseL2Loss=0.2746
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=970/500000]
+ train/ActionNoiseL2Loss=0.3058
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=971/500000]
+ train/ActionNoiseL2Loss=0.2012
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=972/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=973/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=974/500000]
+ train/ActionNoiseL2Loss=0.2338
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=975/500000]
+ train/ActionNoiseL2Loss=0.3069
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=976/500000]
+ train/ActionNoiseL2Loss=0.2313
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=977/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=978/500000]
+ train/ActionNoiseL2Loss=0.2694
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=979/500000]
+ train/ActionNoiseL2Loss=0.1751
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=980/500000]
+ optim/total_grad_norm=5.630
+ train/ActionNoiseL2Loss=0.1802
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=981/500000]
+ train/ActionNoiseL2Loss=0.2371
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=982/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=983/500000]
+ train/ActionNoiseL2Loss=0.2042
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=984/500000]
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=985/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=986/500000]
+ train/ActionNoiseL2Loss=0.2208
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=987/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=988/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=989/500000]
+ train/ActionNoiseL2Loss=0.3148
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=990/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=991/500000]
+ train/ActionNoiseL2Loss=0.2046
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=992/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=993/500000]
+ train/ActionNoiseL2Loss=0.2331
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=994/500000]
+ train/ActionNoiseL2Loss=0.3325
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=995/500000]
+ train/ActionNoiseL2Loss=0.1952
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=996/500000]
+ train/ActionNoiseL2Loss=0.3278
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=997/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=998/500000]
+ train/ActionNoiseL2Loss=0.2305
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=999/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1000/500000]
+ optim/total_grad_norm=7.084
+ train/ActionNoiseL2Loss=0.3021
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/02 [22:37:38] INFO | >> Saving config... checkpoint.py:608
+10/02 [22:38:11] INFO | >> Saving model state... checkpoint.py:796
+10/02 [22:39:25] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [22:40:59] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionNoiseL2Loss=0.3259
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1002/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1003/500000]
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1004/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1005/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1006/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1007/500000]
+ train/ActionNoiseL2Loss=0.1632
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1008/500000]
+ train/ActionNoiseL2Loss=0.1862
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1009/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1010/500000]
+ train/ActionNoiseL2Loss=0.2200
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1011/500000]
+ train/ActionNoiseL2Loss=0.1868
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1012/500000]
+ train/ActionNoiseL2Loss=0.2421
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1013/500000]
+ train/ActionNoiseL2Loss=0.1790
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1014/500000]
+ train/ActionNoiseL2Loss=0.2199
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1015/500000]
+ train/ActionNoiseL2Loss=0.2245
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1016/500000]
+ train/ActionNoiseL2Loss=0.2646
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1017/500000]
+ train/ActionNoiseL2Loss=0.2852
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1018/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1019/500000]
+ train/ActionNoiseL2Loss=0.1980
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1020/500000]
+ optim/total_grad_norm=6.463
+ train/ActionNoiseL2Loss=0.2718
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1021/500000]
+ train/ActionNoiseL2Loss=0.2434
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1022/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1023/500000]
+ train/ActionNoiseL2Loss=0.1647
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1024/500000]
+ train/ActionNoiseL2Loss=0.1852
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1025/500000]
+ train/ActionNoiseL2Loss=0.1973
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1026/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1027/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1028/500000]
+ train/ActionNoiseL2Loss=0.2475
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1029/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1030/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1031/500000]
+ train/ActionNoiseL2Loss=0.2413
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1032/500000]
+ train/ActionNoiseL2Loss=0.2345
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1033/500000]
+ train/ActionNoiseL2Loss=0.2271
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1034/500000]
+ train/ActionNoiseL2Loss=0.2145
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1035/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1036/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1037/500000]
+ train/ActionNoiseL2Loss=0.2262
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1038/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1039/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1040/500000]
+ optim/total_grad_norm=5.609
+ train/ActionNoiseL2Loss=0.2353
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1041/500000]
+ train/ActionNoiseL2Loss=0.2689
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1042/500000]
+ train/ActionNoiseL2Loss=0.1713
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1043/500000]
+ train/ActionNoiseL2Loss=0.2610
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1044/500000]
+ train/ActionNoiseL2Loss=0.1697
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1045/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1046/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1047/500000]
+ train/ActionNoiseL2Loss=0.2800
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1048/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1049/500000]
+ train/ActionNoiseL2Loss=0.1672
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1050/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1051/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1052/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1053/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1054/500000]
+ train/ActionNoiseL2Loss=0.2089
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1055/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1056/500000]
+ train/ActionNoiseL2Loss=0.3045
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1057/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1058/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1059/500000]
+ train/ActionNoiseL2Loss=0.2596
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1060/500000]
+ optim/total_grad_norm=5.023
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1061/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1062/500000]
+ train/ActionNoiseL2Loss=0.3000
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1063/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1064/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1065/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1066/500000]
+ train/ActionNoiseL2Loss=0.1813
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1067/500000]
+ train/ActionNoiseL2Loss=0.2794
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1068/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1069/500000]
+ train/ActionNoiseL2Loss=0.3266
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1070/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1071/500000]
+ train/ActionNoiseL2Loss=0.2650
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1072/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1073/500000]
+ train/ActionNoiseL2Loss=0.1967
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1074/500000]
+ train/ActionNoiseL2Loss=0.2089
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1075/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1076/500000]
+ train/ActionNoiseL2Loss=0.2779
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1077/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1078/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1079/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1080/500000]
+ optim/total_grad_norm=5.216
+ train/ActionNoiseL2Loss=0.2109
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1081/500000]
+ train/ActionNoiseL2Loss=0.2683
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1082/500000]
+ train/ActionNoiseL2Loss=0.2364
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1083/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1084/500000]
+ train/ActionNoiseL2Loss=0.2625
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1085/500000]
+ train/ActionNoiseL2Loss=0.2259
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1086/500000]
+ train/ActionNoiseL2Loss=0.2955
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1087/500000]
+ train/ActionNoiseL2Loss=0.2211
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1088/500000]
+ train/ActionNoiseL2Loss=0.2289
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1089/500000]
+ train/ActionNoiseL2Loss=0.2195
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1090/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1091/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1092/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1093/500000]
+ train/ActionNoiseL2Loss=0.2367
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1094/500000]
+ train/ActionNoiseL2Loss=0.2836
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1095/500000]
+ train/ActionNoiseL2Loss=0.2782
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1096/500000]
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1097/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1098/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1099/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1100/500000]
+ optim/total_grad_norm=4.569
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1101/500000]
+ train/ActionNoiseL2Loss=0.3045
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1102/500000]
+ train/ActionNoiseL2Loss=0.1644
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1103/500000]
+ train/ActionNoiseL2Loss=0.2465
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1104/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1105/500000]
+ train/ActionNoiseL2Loss=0.2357
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1106/500000]
+ train/ActionNoiseL2Loss=0.3882
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1107/500000]
+ train/ActionNoiseL2Loss=0.2496
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1108/500000]
+ train/ActionNoiseL2Loss=0.1406
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1109/500000]
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1110/500000]
+ train/ActionNoiseL2Loss=0.1967
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1111/500000]
+ train/ActionNoiseL2Loss=0.2106
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1112/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1113/500000]
+ train/ActionNoiseL2Loss=0.2498
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1114/500000]
+ train/ActionNoiseL2Loss=0.2277
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1115/500000]
+ train/ActionNoiseL2Loss=0.2857
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1116/500000]
+ train/ActionNoiseL2Loss=0.3374
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1117/500000]
+ train/ActionNoiseL2Loss=0.2124
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1118/500000]
+ train/ActionNoiseL2Loss=0.3262
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1119/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1120/500000]
+ optim/total_grad_norm=5.041
+ train/ActionNoiseL2Loss=0.1787
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1121/500000]
+ train/ActionNoiseL2Loss=0.1826
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1122/500000]
+ train/ActionNoiseL2Loss=0.2036
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1123/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1124/500000]
+ train/ActionNoiseL2Loss=0.3056
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1125/500000]
+ train/ActionNoiseL2Loss=0.1950
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1126/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1127/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1128/500000]
+ train/ActionNoiseL2Loss=0.2093
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1129/500000]
+ train/ActionNoiseL2Loss=0.2223
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1130/500000]
+ train/ActionNoiseL2Loss=0.2141
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1131/500000]
+ train/ActionNoiseL2Loss=0.2212
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1132/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1133/500000]
+ train/ActionNoiseL2Loss=0.2022
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1134/500000]
+ train/ActionNoiseL2Loss=0.2517
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1135/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1136/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1137/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1138/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1139/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1140/500000]
+ optim/total_grad_norm=5.558
+ train/ActionNoiseL2Loss=0.3292
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1141/500000]
+ train/ActionNoiseL2Loss=0.3382
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1142/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1143/500000]
+ train/ActionNoiseL2Loss=0.2007
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1144/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1145/500000]
+ train/ActionNoiseL2Loss=0.3150
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1146/500000]
+ train/ActionNoiseL2Loss=0.3237
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1147/500000]
+ train/ActionNoiseL2Loss=0.2999
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1148/500000]
+ train/ActionNoiseL2Loss=0.2380
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1149/500000]
+ train/ActionNoiseL2Loss=0.2657
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1150/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1151/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1152/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1153/500000]
+ train/ActionNoiseL2Loss=0.1975
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1154/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1155/500000]
+ train/ActionNoiseL2Loss=0.2482
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1156/500000]
+ train/ActionNoiseL2Loss=0.3058
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1157/500000]
+ train/ActionNoiseL2Loss=0.2723
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1158/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1159/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1160/500000]
+ optim/total_grad_norm=3.304
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1161/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1162/500000]
+ train/ActionNoiseL2Loss=0.2470
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1163/500000]
+ train/ActionNoiseL2Loss=0.2122
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1164/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1165/500000]
+ train/ActionNoiseL2Loss=0.2243
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1166/500000]
+ train/ActionNoiseL2Loss=0.1633
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1167/500000]
+ train/ActionNoiseL2Loss=0.2618
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1168/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1169/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1170/500000]
+ train/ActionNoiseL2Loss=0.2172
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1171/500000]
+ train/ActionNoiseL2Loss=0.4322
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1172/500000]
+ train/ActionNoiseL2Loss=0.1868
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1173/500000]
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1174/500000]
+ train/ActionNoiseL2Loss=0.2790
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1175/500000]
+ train/ActionNoiseL2Loss=0.1964
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1176/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1177/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1178/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1179/500000]
+ train/ActionNoiseL2Loss=0.2236
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1180/500000]
+ optim/total_grad_norm=5.071
+ train/ActionNoiseL2Loss=0.1867
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1181/500000]
+ train/ActionNoiseL2Loss=0.2706
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1182/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1183/500000]
+ train/ActionNoiseL2Loss=0.1670
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1184/500000]
+ train/ActionNoiseL2Loss=0.1713
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1185/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1186/500000]
+ train/ActionNoiseL2Loss=0.2627
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1187/500000]
+ train/ActionNoiseL2Loss=0.2699
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1188/500000]
+ train/ActionNoiseL2Loss=0.2858
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1189/500000]
+ train/ActionNoiseL2Loss=0.2844
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1190/500000]
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1191/500000]
+ train/ActionNoiseL2Loss=0.2304
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1192/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1193/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1194/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1195/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1196/500000]
+ train/ActionNoiseL2Loss=0.1965
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1197/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1198/500000]
+ train/ActionNoiseL2Loss=0.1876
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1199/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1200/500000]
+ optim/total_grad_norm=4.219
+ train/ActionNoiseL2Loss=0.1856
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1201/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1202/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1203/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1204/500000]
+ train/ActionNoiseL2Loss=0.2637
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1205/500000]
+ train/ActionNoiseL2Loss=0.1558
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1206/500000]
+ train/ActionNoiseL2Loss=0.2507
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1207/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1208/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1209/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1210/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1211/500000]
+ train/ActionNoiseL2Loss=0.2902
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1212/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1213/500000]
+ train/ActionNoiseL2Loss=0.3157
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1214/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1215/500000]
+ train/ActionNoiseL2Loss=0.2813
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1216/500000]
+ train/ActionNoiseL2Loss=0.3108
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1217/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1218/500000]
+ train/ActionNoiseL2Loss=0.2257
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1219/500000]
+ train/ActionNoiseL2Loss=0.1993
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1220/500000]
+ optim/total_grad_norm=3.464
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1221/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1222/500000]
+ train/ActionNoiseL2Loss=0.3843
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1223/500000]
+ train/ActionNoiseL2Loss=0.2484
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1224/500000]
+ train/ActionNoiseL2Loss=0.2230
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1225/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1226/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1227/500000]
+ train/ActionNoiseL2Loss=0.2038
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1228/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1229/500000]
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1230/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1231/500000]
+ train/ActionNoiseL2Loss=0.2498
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1232/500000]
+ train/ActionNoiseL2Loss=0.2554
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1233/500000]
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1234/500000]
+ train/ActionNoiseL2Loss=0.3286
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1235/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1236/500000]
+ train/ActionNoiseL2Loss=0.2383
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1237/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1238/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1239/500000]
+ train/ActionNoiseL2Loss=0.2154
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1240/500000]
+ optim/total_grad_norm=4.880
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1241/500000]
+ train/ActionNoiseL2Loss=0.2171
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1242/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1243/500000]
+ train/ActionNoiseL2Loss=0.2288
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1244/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1245/500000]
+ train/ActionNoiseL2Loss=0.2451
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1246/500000]
+ train/ActionNoiseL2Loss=0.2267
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1247/500000]
+ train/ActionNoiseL2Loss=0.1746
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1248/500000]
+ train/ActionNoiseL2Loss=0.2002
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1249/500000]
+ train/ActionNoiseL2Loss=0.1641
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1250/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1251/500000]
+ train/ActionNoiseL2Loss=0.1808
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1252/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1253/500000]
+ train/ActionNoiseL2Loss=0.1885
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1254/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1255/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1256/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1257/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1258/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1259/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1260/500000]
+ optim/total_grad_norm=4.447
+ train/ActionNoiseL2Loss=0.1866
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1261/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1262/500000]
+ train/ActionNoiseL2Loss=0.2586
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1263/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1264/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1265/500000]
+ train/ActionNoiseL2Loss=0.1758
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1266/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1267/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1268/500000]
+ train/ActionNoiseL2Loss=0.1651
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1269/500000]
+ train/ActionNoiseL2Loss=0.2423
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1270/500000]
+ train/ActionNoiseL2Loss=0.2249
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1271/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1272/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1273/500000]
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1274/500000]
+ train/ActionNoiseL2Loss=0.1823
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1275/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1276/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1277/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1278/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1279/500000]
+ train/ActionNoiseL2Loss=0.2024
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1280/500000]
+ optim/total_grad_norm=3.892
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1281/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1282/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1283/500000]
+ train/ActionNoiseL2Loss=0.2088
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1284/500000]
+ train/ActionNoiseL2Loss=0.2221
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1285/500000]
+ train/ActionNoiseL2Loss=0.1955
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1286/500000]
+ train/ActionNoiseL2Loss=0.2029
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1287/500000]
+ train/ActionNoiseL2Loss=0.2037
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1288/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1289/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1290/500000]
+ train/ActionNoiseL2Loss=0.2139
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1291/500000]
+ train/ActionNoiseL2Loss=0.2923
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1292/500000]
+ train/ActionNoiseL2Loss=0.1744
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1293/500000]
+ train/ActionNoiseL2Loss=0.3036
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1294/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1295/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1296/500000]
+ train/ActionNoiseL2Loss=0.3058
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1297/500000]
+ train/ActionNoiseL2Loss=0.2064
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1298/500000]
+ train/ActionNoiseL2Loss=0.3043
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1299/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1300/500000]
+ optim/total_grad_norm=3.585
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1301/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1302/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1303/500000]
+ train/ActionNoiseL2Loss=0.1622
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1304/500000]
+ train/ActionNoiseL2Loss=0.1876
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1305/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1306/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1307/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1308/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1309/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1310/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1311/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1312/500000]
+ train/ActionNoiseL2Loss=0.1967
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1313/500000]
+ train/ActionNoiseL2Loss=0.1995
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1314/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1315/500000]
+ train/ActionNoiseL2Loss=0.1830
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1316/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1317/500000]
+ train/ActionNoiseL2Loss=0.1688
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1318/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1319/500000]
+ train/ActionNoiseL2Loss=0.2382
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1320/500000]
+ optim/total_grad_norm=5.794
+ train/ActionNoiseL2Loss=0.2444
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1321/500000]
+ train/ActionNoiseL2Loss=0.2618
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1322/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1323/500000]
+ train/ActionNoiseL2Loss=0.1964
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1324/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1325/500000]
+ train/ActionNoiseL2Loss=0.1981
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1326/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1327/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1328/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1329/500000]
+ train/ActionNoiseL2Loss=0.2181
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1330/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1331/500000]
+ train/ActionNoiseL2Loss=0.2522
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1332/500000]
+ train/ActionNoiseL2Loss=0.2585
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1333/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1334/500000]
+ train/ActionNoiseL2Loss=0.2423
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1335/500000]
+ train/ActionNoiseL2Loss=0.2287
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1336/500000]
+ train/ActionNoiseL2Loss=0.1974
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1337/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1338/500000]
+ train/ActionNoiseL2Loss=0.2163
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1339/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1340/500000]
+ optim/total_grad_norm=4.385
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1341/500000]
+ train/ActionNoiseL2Loss=0.1943
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1342/500000]
+ train/ActionNoiseL2Loss=0.2059
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1343/500000]
+ train/ActionNoiseL2Loss=0.1436
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1344/500000]
+ train/ActionNoiseL2Loss=0.2836
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1345/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1346/500000]
+ train/ActionNoiseL2Loss=0.1823
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1347/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1348/500000]
+ train/ActionNoiseL2Loss=0.3939
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1349/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1350/500000]
+ train/ActionNoiseL2Loss=0.2415
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1351/500000]
+ train/ActionNoiseL2Loss=0.1787
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1352/500000]
+ train/ActionNoiseL2Loss=0.1970
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1353/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1354/500000]
+ train/ActionNoiseL2Loss=0.3070
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1355/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1356/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1357/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1358/500000]
+ train/ActionNoiseL2Loss=0.2542
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1359/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1360/500000]
+ optim/total_grad_norm=4.505
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1361/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1362/500000]
+ train/ActionNoiseL2Loss=0.2646
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1363/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1364/500000]
+ train/ActionNoiseL2Loss=0.2236
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1365/500000]
+ train/ActionNoiseL2Loss=0.1666
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1366/500000]
+ train/ActionNoiseL2Loss=0.2527
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1367/500000]
+ train/ActionNoiseL2Loss=0.1801
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1368/500000]
+ train/ActionNoiseL2Loss=0.1670
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1369/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1370/500000]
+ train/ActionNoiseL2Loss=0.3687
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1371/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1372/500000]
+ train/ActionNoiseL2Loss=0.3101
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1373/500000]
+ train/ActionNoiseL2Loss=0.2362
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1374/500000]
+ train/ActionNoiseL2Loss=0.2849
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1375/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1376/500000]
+ train/ActionNoiseL2Loss=0.1603
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1377/500000]
+ train/ActionNoiseL2Loss=0.1626
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1378/500000]
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1379/500000]
+ train/ActionNoiseL2Loss=0.2017
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1380/500000]
+ optim/total_grad_norm=3.669
+ train/ActionNoiseL2Loss=0.1686
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1381/500000]
+ train/ActionNoiseL2Loss=0.2207
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1382/500000]
+ train/ActionNoiseL2Loss=0.4008
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1383/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1384/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1385/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1386/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1387/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1388/500000]
+ train/ActionNoiseL2Loss=0.2312
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1389/500000]
+ train/ActionNoiseL2Loss=0.2993
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1390/500000]
+ train/ActionNoiseL2Loss=0.1910
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1391/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1392/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1393/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1394/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1395/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1396/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1397/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1398/500000]
+ train/ActionNoiseL2Loss=0.1756
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1399/500000]
+ train/ActionNoiseL2Loss=0.2774
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1400/500000]
+ optim/total_grad_norm=2.952
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1401/500000]
+ train/ActionNoiseL2Loss=0.1947
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1402/500000]
+ train/ActionNoiseL2Loss=0.2384
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1403/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1404/500000]
+ train/ActionNoiseL2Loss=0.2337
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1405/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1406/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1407/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1408/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1409/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1410/500000]
+ train/ActionNoiseL2Loss=0.2978
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1411/500000]
+ train/ActionNoiseL2Loss=0.2678
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1412/500000]
+ train/ActionNoiseL2Loss=0.1669
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1413/500000]
+ train/ActionNoiseL2Loss=0.2988
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1414/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1415/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1416/500000]
+ train/ActionNoiseL2Loss=0.2073
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1417/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1418/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1419/500000]
+ train/ActionNoiseL2Loss=0.2409
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1420/500000]
+ optim/total_grad_norm=3.405
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1421/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1422/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1423/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1424/500000]
+ train/ActionNoiseL2Loss=0.2582
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1425/500000]
+ train/ActionNoiseL2Loss=0.1987
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1426/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1427/500000]
+ train/ActionNoiseL2Loss=0.1975
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1428/500000]
+ train/ActionNoiseL2Loss=0.1780
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1429/500000]
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1430/500000]
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1431/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1432/500000]
+ train/ActionNoiseL2Loss=0.2620
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1433/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1434/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1435/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1436/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1437/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1438/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1439/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1440/500000]
+ optim/total_grad_norm=2.043
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1441/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1442/500000]
+ train/ActionNoiseL2Loss=0.2546
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1443/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1444/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1445/500000]
+ train/ActionNoiseL2Loss=0.1783
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1446/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1447/500000]
+ train/ActionNoiseL2Loss=0.2625
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1448/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1449/500000]
+ train/ActionNoiseL2Loss=0.2143
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1450/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1451/500000]
+ train/ActionNoiseL2Loss=0.2815
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1452/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1453/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1454/500000]
+ train/ActionNoiseL2Loss=0.2792
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1455/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1456/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1457/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1458/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1459/500000]
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1460/500000]
+ optim/total_grad_norm=5.481
+ train/ActionNoiseL2Loss=0.2157
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1461/500000]
+ train/ActionNoiseL2Loss=0.3143
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1462/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1463/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1464/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1465/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1466/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1467/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1468/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1469/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1470/500000]
+ train/ActionNoiseL2Loss=0.2094
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1471/500000]
+ train/ActionNoiseL2Loss=0.2020
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1472/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1473/500000]
+ train/ActionNoiseL2Loss=0.2475
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1474/500000]
+ train/ActionNoiseL2Loss=0.2545
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1475/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1476/500000]
+ train/ActionNoiseL2Loss=0.2056
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1477/500000]
+ train/ActionNoiseL2Loss=0.2428
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1478/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1479/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1480/500000]
+ optim/total_grad_norm=2.925
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1481/500000]
+ train/ActionNoiseL2Loss=0.2058
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1482/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1483/500000]
+ train/ActionNoiseL2Loss=0.2388
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1484/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1485/500000]
+ train/ActionNoiseL2Loss=0.2164
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1486/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1487/500000]
+ train/ActionNoiseL2Loss=0.2121
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1488/500000]
+ train/ActionNoiseL2Loss=0.2548
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1489/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1490/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1491/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1492/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1493/500000]
+ train/ActionNoiseL2Loss=0.2249
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1494/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1495/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1496/500000]
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1497/500000]
+ train/ActionNoiseL2Loss=0.2656
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1498/500000]
+ train/ActionNoiseL2Loss=0.2449
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1499/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1500/500000]
+ optim/total_grad_norm=2.646
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/03 [01:35:00] INFO | >> Saving config... checkpoint.py:608
+10/03 [01:35:34] INFO | >> Saving model state... checkpoint.py:796
+10/03 [01:36:47] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [01:38:19] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=1502/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=1503/500000]
+ train/ActionNoiseL2Loss=0.2897
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=1504/500000]
+ train/ActionNoiseL2Loss=0.2598
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=1505/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1506/500000]
+ train/ActionNoiseL2Loss=0.2580
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1507/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1508/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1509/500000]
+ train/ActionNoiseL2Loss=0.2250
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1510/500000]
+ train/ActionNoiseL2Loss=0.2292
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1511/500000]
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1512/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1513/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1514/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1515/500000]
+ train/ActionNoiseL2Loss=0.2184
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1516/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1517/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1518/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1519/500000]
+ train/ActionNoiseL2Loss=0.1443
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1520/500000]
+ optim/total_grad_norm=2.598
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1521/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1522/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1523/500000]
+ train/ActionNoiseL2Loss=0.2002
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1524/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1525/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1526/500000]
+ train/ActionNoiseL2Loss=0.2584
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1527/500000]
+ train/ActionNoiseL2Loss=0.1847
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1528/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1529/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1530/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1531/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1532/500000]
+ train/ActionNoiseL2Loss=0.2617
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1533/500000]
+ train/ActionNoiseL2Loss=0.2220
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1534/500000]
+ train/ActionNoiseL2Loss=0.2401
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1535/500000]
+ train/ActionNoiseL2Loss=0.1768
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1536/500000]
+ train/ActionNoiseL2Loss=0.1780
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1537/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1538/500000]
+ train/ActionNoiseL2Loss=0.2775
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1539/500000]
+ train/ActionNoiseL2Loss=0.1974
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1540/500000]
+ optim/total_grad_norm=3.877
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1541/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1542/500000]
+ train/ActionNoiseL2Loss=0.1728
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1543/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1544/500000]
+ train/ActionNoiseL2Loss=0.2066
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1545/500000]
+ train/ActionNoiseL2Loss=0.1993
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1546/500000]
+ train/ActionNoiseL2Loss=0.1656
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1547/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1548/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1549/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1550/500000]
+ train/ActionNoiseL2Loss=0.1945
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1551/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1552/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1553/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1554/500000]
+ train/ActionNoiseL2Loss=0.2228
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1555/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1556/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1557/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1558/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1559/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1560/500000]
+ optim/total_grad_norm=3.008
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1561/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1562/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1563/500000]
+ train/ActionNoiseL2Loss=0.1743
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1564/500000]
+ train/ActionNoiseL2Loss=0.2295
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1565/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1566/500000]
+ train/ActionNoiseL2Loss=0.2739
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1567/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1568/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1569/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1570/500000]
+ train/ActionNoiseL2Loss=0.2266
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1571/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1572/500000]
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1573/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1574/500000]
+ train/ActionNoiseL2Loss=0.1697
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1575/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1576/500000]
+ train/ActionNoiseL2Loss=0.2487
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1577/500000]
+ train/ActionNoiseL2Loss=0.2210
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1578/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1579/500000]
+ train/ActionNoiseL2Loss=0.2315
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1580/500000]
+ optim/total_grad_norm=3.211
+ train/ActionNoiseL2Loss=0.1905
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1581/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1582/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1583/500000]
+ train/ActionNoiseL2Loss=0.1701
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1584/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1585/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1586/500000]
+ train/ActionNoiseL2Loss=0.2084
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1587/500000]
+ train/ActionNoiseL2Loss=0.2141
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1588/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1589/500000]
+ train/ActionNoiseL2Loss=0.2242
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1590/500000]
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1591/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1592/500000]
+ train/ActionNoiseL2Loss=0.2023
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1593/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1594/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1595/500000]
+ train/ActionNoiseL2Loss=0.2329
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1596/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1597/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1598/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1599/500000]
+ train/ActionNoiseL2Loss=0.2664
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1600/500000]
+ optim/total_grad_norm=4.048
+ train/ActionNoiseL2Loss=0.2094
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1601/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1602/500000]
+ train/ActionNoiseL2Loss=0.1794
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1603/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1604/500000]
+ train/ActionNoiseL2Loss=0.2157
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1605/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1606/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1607/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1608/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1609/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1610/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1611/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1612/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1613/500000]
+ train/ActionNoiseL2Loss=0.2392
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1614/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1615/500000]
+ train/ActionNoiseL2Loss=0.1566
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1616/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1617/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1618/500000]
+ train/ActionNoiseL2Loss=0.1830
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1619/500000]
+ train/ActionNoiseL2Loss=0.1954
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1620/500000]
+ optim/total_grad_norm=2.851
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1621/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1622/500000]
+ train/ActionNoiseL2Loss=0.1794
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1623/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1624/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1625/500000]
+ train/ActionNoiseL2Loss=0.1896
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1626/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1627/500000]
+ train/ActionNoiseL2Loss=0.1712
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1628/500000]
+ train/ActionNoiseL2Loss=0.2509
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1629/500000]
+ train/ActionNoiseL2Loss=0.1614
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1630/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1631/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1632/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1633/500000]
+ train/ActionNoiseL2Loss=0.2052
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1634/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1635/500000]
+ train/ActionNoiseL2Loss=0.2382
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1636/500000]
+ train/ActionNoiseL2Loss=0.2488
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1637/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1638/500000]
+ train/ActionNoiseL2Loss=0.2883
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1639/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1640/500000]
+ optim/total_grad_norm=3.645
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1641/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1642/500000]
+ train/ActionNoiseL2Loss=0.2371
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1643/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1644/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1645/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1646/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1647/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1648/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1649/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1650/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1651/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1652/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1653/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1654/500000]
+ train/ActionNoiseL2Loss=0.2424
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1655/500000]
+ train/ActionNoiseL2Loss=0.2133
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1656/500000]
+ train/ActionNoiseL2Loss=0.2833
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1657/500000]
+ train/ActionNoiseL2Loss=0.1977
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1658/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1659/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1660/500000]
+ optim/total_grad_norm=3.408
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1661/500000]
+ train/ActionNoiseL2Loss=0.2624
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1662/500000]
+ train/ActionNoiseL2Loss=0.1954
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1663/500000]
+ train/ActionNoiseL2Loss=0.2569
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1664/500000]
+ train/ActionNoiseL2Loss=0.2528
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1665/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1666/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1667/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1668/500000]
+ train/ActionNoiseL2Loss=0.2685
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1669/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1670/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1671/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1672/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1673/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1674/500000]
+ train/ActionNoiseL2Loss=0.2039
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1675/500000]
+ train/ActionNoiseL2Loss=0.2251
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1676/500000]
+ train/ActionNoiseL2Loss=0.2088
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1677/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1678/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1679/500000]
+ train/ActionNoiseL2Loss=0.2157
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1680/500000]
+ optim/total_grad_norm=3.106
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1681/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1682/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1683/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1684/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1685/500000]
+ train/ActionNoiseL2Loss=0.2696
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1686/500000]
+ train/ActionNoiseL2Loss=0.1443
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1687/500000]
+ train/ActionNoiseL2Loss=0.1955
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1688/500000]
+ train/ActionNoiseL2Loss=0.2305
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1689/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1690/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1691/500000]
+ train/ActionNoiseL2Loss=0.1724
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1692/500000]
+ train/ActionNoiseL2Loss=0.2136
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1693/500000]
+ train/ActionNoiseL2Loss=0.2673
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1694/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1695/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1696/500000]
+ train/ActionNoiseL2Loss=0.2410
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1697/500000]
+ train/ActionNoiseL2Loss=0.2440
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1698/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1699/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1700/500000]
+ optim/total_grad_norm=3.445
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1701/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1702/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1703/500000]
+ train/ActionNoiseL2Loss=0.1986
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1704/500000]
+ train/ActionNoiseL2Loss=0.1647
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1705/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1706/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1707/500000]
+ train/ActionNoiseL2Loss=0.2285
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1708/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1709/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1710/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1711/500000]
+ train/ActionNoiseL2Loss=0.2008
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1712/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1713/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1714/500000]
+ train/ActionNoiseL2Loss=0.3293
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1715/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1716/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1717/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1718/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1719/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1720/500000]
+ optim/total_grad_norm=3.239
+ train/ActionNoiseL2Loss=0.1777
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1721/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1722/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1723/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1724/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1725/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1726/500000]
+ train/ActionNoiseL2Loss=0.2023
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1727/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1728/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1729/500000]
+ train/ActionNoiseL2Loss=0.1819
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1730/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1731/500000]
+ train/ActionNoiseL2Loss=0.1959
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1732/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1733/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1734/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1735/500000]
+ train/ActionNoiseL2Loss=0.2512
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1736/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1737/500000]
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1738/500000]
+ train/ActionNoiseL2Loss=0.2100
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1739/500000]
+ train/ActionNoiseL2Loss=0.1748
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1740/500000]
+ optim/total_grad_norm=2.299
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1741/500000]
+ train/ActionNoiseL2Loss=0.2296
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1742/500000]
+ train/ActionNoiseL2Loss=0.1802
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1743/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1744/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1745/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1746/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1747/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1748/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1749/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1750/500000]
+ train/ActionNoiseL2Loss=0.2885
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1751/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1752/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1753/500000]
+ train/ActionNoiseL2Loss=0.1614
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1754/500000]
+ train/ActionNoiseL2Loss=0.2724
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1755/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1756/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1757/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1758/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1759/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1760/500000]
+ optim/total_grad_norm=2.506
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1761/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1762/500000]
+ train/ActionNoiseL2Loss=0.1947
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1763/500000]
+ train/ActionNoiseL2Loss=0.2529
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1764/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1765/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1766/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1767/500000]
+ train/ActionNoiseL2Loss=0.1957
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1768/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1769/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1770/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1771/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1772/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1773/500000]
+ train/ActionNoiseL2Loss=0.2295
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1774/500000]
+ train/ActionNoiseL2Loss=0.2468
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1775/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1776/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1777/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1778/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1779/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1780/500000]
+ optim/total_grad_norm=2.776
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1781/500000]
+ train/ActionNoiseL2Loss=0.1838
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1782/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1783/500000]
+ train/ActionNoiseL2Loss=0.2075
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1784/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1785/500000]
+ train/ActionNoiseL2Loss=0.2786
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1786/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1787/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1788/500000]
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1789/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1790/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1791/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1792/500000]
+ train/ActionNoiseL2Loss=0.1539
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1793/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1794/500000]
+ train/ActionNoiseL2Loss=0.1748
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1795/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1796/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1797/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1798/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1799/500000]
+ train/ActionNoiseL2Loss=0.1554
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1800/500000]
+ optim/total_grad_norm=2.358
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1801/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1802/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1803/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1804/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1805/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1806/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1807/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1808/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1809/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1810/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1811/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1812/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1813/500000]
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1814/500000]
+ train/ActionNoiseL2Loss=0.2440
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1815/500000]
+ train/ActionNoiseL2Loss=0.1409
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1816/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1817/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1818/500000]
+ train/ActionNoiseL2Loss=0.1750
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1819/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1820/500000]
+ optim/total_grad_norm=3.098
+ train/ActionNoiseL2Loss=0.2268
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1821/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1822/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1823/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1824/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1825/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1826/500000]
+ train/ActionNoiseL2Loss=0.2937
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1827/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1828/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1829/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1830/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1831/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1832/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1833/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1834/500000]
+ train/ActionNoiseL2Loss=0.1990
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1835/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1836/500000]
+ train/ActionNoiseL2Loss=0.2149
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1837/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1838/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1839/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1840/500000]
+ optim/total_grad_norm=3.285
+ train/ActionNoiseL2Loss=0.2006
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1841/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1842/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1843/500000]
+ train/ActionNoiseL2Loss=0.2170
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1844/500000]
+ train/ActionNoiseL2Loss=0.3199
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1845/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1846/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1847/500000]
+ train/ActionNoiseL2Loss=0.1393
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1848/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1849/500000]
+ train/ActionNoiseL2Loss=0.1892
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1850/500000]
+ train/ActionNoiseL2Loss=0.2952
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1851/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1852/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1853/500000]
+ train/ActionNoiseL2Loss=0.1876
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1854/500000]
+ train/ActionNoiseL2Loss=0.1908
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1855/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1856/500000]
+ train/ActionNoiseL2Loss=0.2096
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1857/500000]
+ train/ActionNoiseL2Loss=0.2379
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1858/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1859/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1860/500000]
+ optim/total_grad_norm=3.353
+ train/ActionNoiseL2Loss=0.2395
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1861/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1862/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1863/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1864/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1865/500000]
+ train/ActionNoiseL2Loss=0.1926
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1866/500000]
+ train/ActionNoiseL2Loss=0.1945
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1867/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1868/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1869/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=1870/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=1871/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1872/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1873/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1874/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1875/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1876/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1877/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1878/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=1879/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1880/500000]
+ optim/total_grad_norm=2.754
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1881/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1882/500000]
+ train/ActionNoiseL2Loss=0.2679
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1883/500000]
+ train/ActionNoiseL2Loss=0.2055
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1884/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1885/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1886/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1887/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1888/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1889/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1890/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1891/500000]
+ train/ActionNoiseL2Loss=0.2162
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1892/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1893/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1894/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1895/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1896/500000]
+ train/ActionNoiseL2Loss=0.2370
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1897/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1898/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1899/500000]
+ train/ActionNoiseL2Loss=0.2865
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1900/500000]
+ optim/total_grad_norm=3.136
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1901/500000]
+ train/ActionNoiseL2Loss=0.2733
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1902/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1903/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1904/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1905/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1906/500000]
+ train/ActionNoiseL2Loss=0.1751
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1907/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1908/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1909/500000]
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1910/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1911/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1912/500000]
+ train/ActionNoiseL2Loss=0.2215
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1913/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1914/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1915/500000]
+ train/ActionNoiseL2Loss=0.2132
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1916/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1917/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1918/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1919/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1920/500000]
+ optim/total_grad_norm=3.834
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1921/500000]
+ train/ActionNoiseL2Loss=0.2003
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1922/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1923/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1924/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1925/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1926/500000]
+ train/ActionNoiseL2Loss=0.2936
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1927/500000]
+ train/ActionNoiseL2Loss=0.2012
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1928/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1929/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1930/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1931/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1932/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1933/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1934/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1935/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1936/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1937/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1938/500000]
+ train/ActionNoiseL2Loss=0.1919
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1939/500000]
+ train/ActionNoiseL2Loss=0.2303
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1940/500000]
+ optim/total_grad_norm=3.759
+ train/ActionNoiseL2Loss=0.2013
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1941/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1942/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1943/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1944/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1945/500000]
+ train/ActionNoiseL2Loss=0.2111
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1946/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1947/500000]
+ train/ActionNoiseL2Loss=0.1857
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1948/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1949/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1950/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1951/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1952/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1953/500000]
+ train/ActionNoiseL2Loss=0.2154
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1954/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1955/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1956/500000]
+ train/ActionNoiseL2Loss=0.1678
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1957/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1958/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1959/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1960/500000]
+ optim/total_grad_norm=3.503
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1961/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1962/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1963/500000]
+ train/ActionNoiseL2Loss=0.1915
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1964/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1965/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1966/500000]
+ train/ActionNoiseL2Loss=0.1444
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1967/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1968/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1969/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1970/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1971/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1972/500000]
+ train/ActionNoiseL2Loss=0.2332
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1973/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=1974/500000]
+ train/ActionNoiseL2Loss=0.2706
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1975/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1976/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1977/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1978/500000]
+ train/ActionNoiseL2Loss=0.1813
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1979/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1980/500000]
+ optim/total_grad_norm=2.936
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1981/500000]
+ train/ActionNoiseL2Loss=0.1967
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1982/500000]
+ train/ActionNoiseL2Loss=0.1848
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1983/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1984/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1985/500000]
+ train/ActionNoiseL2Loss=0.1960
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1986/500000]
+ train/ActionNoiseL2Loss=0.1994
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1987/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1988/500000]
+ train/ActionNoiseL2Loss=0.1894
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1989/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1990/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=1991/500000]
+ train/ActionNoiseL2Loss=0.2188
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1992/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1993/500000]
+ train/ActionNoiseL2Loss=0.1668
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1994/500000]
+ train/ActionNoiseL2Loss=0.2299
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1995/500000]
+ train/ActionNoiseL2Loss=0.2646
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1996/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1997/500000]
+ train/ActionNoiseL2Loss=0.2340
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1998/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1999/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2000/500000]
+ optim/total_grad_norm=2.550
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/03 [04:31:59] INFO | >> Saving config... checkpoint.py:608
+10/03 [04:32:40] INFO | >> Saving model state... checkpoint.py:796
+10/03 [04:33:53] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [04:35:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2002/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2003/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2004/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2005/500000]
+ train/ActionNoiseL2Loss=0.2396
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2006/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2007/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2008/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2009/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2010/500000]
+ train/ActionNoiseL2Loss=0.1671
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2011/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2012/500000]
+ train/ActionNoiseL2Loss=0.2284
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2013/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2014/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2015/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2016/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2017/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2018/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2019/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2020/500000]
+ optim/total_grad_norm=3.453
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2021/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2022/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2023/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2024/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2025/500000]
+ train/ActionNoiseL2Loss=0.2075
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2026/500000]
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2027/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2028/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2029/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2030/500000]
+ train/ActionNoiseL2Loss=0.1458
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2031/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2032/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2033/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2034/500000]
+ train/ActionNoiseL2Loss=0.2753
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2035/500000]
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2036/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2037/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2038/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2039/500000]
+ train/ActionNoiseL2Loss=0.2541
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2040/500000]
+ optim/total_grad_norm=3.305
+ train/ActionNoiseL2Loss=0.1934
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2041/500000]
+ train/ActionNoiseL2Loss=0.1702
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2042/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2043/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2044/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2045/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2046/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2047/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2048/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2049/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2050/500000]
+ train/ActionNoiseL2Loss=0.1901
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2051/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2052/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2053/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2054/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2055/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2056/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2057/500000]
+ train/ActionNoiseL2Loss=0.2049
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2058/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2059/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2060/500000]
+ optim/total_grad_norm=2.736
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2061/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2062/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2063/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2064/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2065/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2066/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2067/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2068/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2069/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2070/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2071/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2072/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2073/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2074/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2075/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2076/500000]
+ train/ActionNoiseL2Loss=0.1733
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2077/500000]
+ train/ActionNoiseL2Loss=0.2151
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2078/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2079/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2080/500000]
+ optim/total_grad_norm=2.641
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2081/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2082/500000]
+ train/ActionNoiseL2Loss=0.2861
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2083/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2084/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2085/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2086/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2087/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2088/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2089/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2090/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2091/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2092/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2093/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2094/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2095/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2096/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2097/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2098/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2099/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2100/500000]
+ optim/total_grad_norm=2.563
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2101/500000]
+ train/ActionNoiseL2Loss=0.2602
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2102/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2103/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2104/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2105/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2106/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2107/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2108/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2109/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2110/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2111/500000]
+ train/ActionNoiseL2Loss=0.1902
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2112/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2113/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2114/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2115/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2116/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2117/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2118/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2119/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2120/500000]
+ optim/total_grad_norm=1.990
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2121/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2122/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2123/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2124/500000]
+ train/ActionNoiseL2Loss=0.1406
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2125/500000]
+ train/ActionNoiseL2Loss=0.1601
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2126/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2127/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2128/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2129/500000]
+ train/ActionNoiseL2Loss=0.1485
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2130/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2131/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2132/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2133/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2134/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2135/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2136/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2137/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2138/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2139/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2140/500000]
+ optim/total_grad_norm=3.325
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2141/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2142/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2143/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2144/500000]
+ train/ActionNoiseL2Loss=0.2049
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2145/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2146/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2147/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2148/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2149/500000]
+ train/ActionNoiseL2Loss=0.1743
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2150/500000]
+ train/ActionNoiseL2Loss=0.2883
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2151/500000]
+ train/ActionNoiseL2Loss=0.1627
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2152/500000]
+ train/ActionNoiseL2Loss=0.2241
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2153/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2154/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2155/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2156/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2157/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2158/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2159/500000]
+ train/ActionNoiseL2Loss=0.1949
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2160/500000]
+ optim/total_grad_norm=2.837
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2161/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2162/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2163/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2164/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2165/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2166/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2167/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2168/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2169/500000]
+ train/ActionNoiseL2Loss=0.1953
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2170/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2171/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2172/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2173/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2174/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2175/500000]
+ train/ActionNoiseL2Loss=0.1727
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2176/500000]
+ train/ActionNoiseL2Loss=0.2115
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2177/500000]
+ train/ActionNoiseL2Loss=0.2635
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2178/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2179/500000]
+ train/ActionNoiseL2Loss=0.2706
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2180/500000]
+ optim/total_grad_norm=2.374
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2181/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2182/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2183/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2184/500000]
+ train/ActionNoiseL2Loss=0.1724
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2185/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2186/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2187/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2188/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2189/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2190/500000]
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2191/500000]
+ train/ActionNoiseL2Loss=0.1466
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2192/500000]
+ train/ActionNoiseL2Loss=0.2163
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2193/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2194/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2195/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2196/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2197/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2198/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2199/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2200/500000]
+ optim/total_grad_norm=3.162
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2201/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2202/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2203/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2204/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2205/500000]
+ train/ActionNoiseL2Loss=0.1800
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2206/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2207/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2208/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2209/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2210/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2211/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2212/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2213/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2214/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2215/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2216/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2217/500000]
+ train/ActionNoiseL2Loss=0.2062
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2218/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2219/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2220/500000]
+ optim/total_grad_norm=2.011
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2221/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2222/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2223/500000]
+ train/ActionNoiseL2Loss=0.1973
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2224/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2225/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2226/500000]
+ train/ActionNoiseL2Loss=0.2457
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2227/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2228/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2229/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2230/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2231/500000]
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2232/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2233/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2234/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2235/500000]
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2236/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2237/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2238/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2239/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2240/500000]
+ optim/total_grad_norm=2.990
+ train/ActionNoiseL2Loss=0.2000
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2241/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2242/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2243/500000]
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2244/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2245/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2246/500000]
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2247/500000]
+ train/ActionNoiseL2Loss=0.1669
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2248/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2249/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2250/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2251/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2252/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2253/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2254/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2255/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2256/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2257/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2258/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2259/500000]
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2260/500000]
+ optim/total_grad_norm=2.112
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2261/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2262/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2263/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2264/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2265/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2266/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2267/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2268/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2269/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2270/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2271/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2272/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2273/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2274/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2275/500000]
+ train/ActionNoiseL2Loss=0.1404
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2276/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2277/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2278/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2279/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2280/500000]
+ optim/total_grad_norm=2.304
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2281/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2282/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2283/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2284/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2285/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2286/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2287/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2288/500000]
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2289/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2290/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2291/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2292/500000]
+ train/ActionNoiseL2Loss=0.1671
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2293/500000]
+ train/ActionNoiseL2Loss=0.1741
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2294/500000]
+ train/ActionNoiseL2Loss=0.2102
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2295/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2296/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2297/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2298/500000]
+ train/ActionNoiseL2Loss=0.2245
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2299/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2300/500000]
+ optim/total_grad_norm=3.445
+ train/ActionNoiseL2Loss=0.1991
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2301/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2302/500000]
+ train/ActionNoiseL2Loss=0.1797
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2303/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2304/500000]
+ train/ActionNoiseL2Loss=0.2288
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2305/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2306/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2307/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2308/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2309/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2310/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2311/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2312/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2313/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2314/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2315/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2316/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2317/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2318/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2319/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2320/500000]
+ optim/total_grad_norm=2.459
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2321/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2322/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2323/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2324/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2325/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2326/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2327/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2328/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2329/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2330/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2331/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2332/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2333/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2334/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2335/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2336/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2337/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2338/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2339/500000]
+ train/ActionNoiseL2Loss=0.2065
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2340/500000]
+ optim/total_grad_norm=3.212
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2341/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2342/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2343/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2344/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2345/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2346/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2347/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2348/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2349/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2350/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2351/500000]
+ train/ActionNoiseL2Loss=0.2218
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2352/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2353/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2354/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2355/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2356/500000]
+ train/ActionNoiseL2Loss=0.1697
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2357/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2358/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2359/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2360/500000]
+ optim/total_grad_norm=2.203
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2361/500000]
+ train/ActionNoiseL2Loss=0.1624
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2362/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2363/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2364/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2365/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2366/500000]
+ train/ActionNoiseL2Loss=0.1703
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2367/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2368/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2369/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2370/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2371/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2372/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2373/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2374/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2375/500000]
+ train/ActionNoiseL2Loss=0.1953
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2376/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2377/500000]
+ train/ActionNoiseL2Loss=0.2219
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2378/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2379/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2380/500000]
+ optim/total_grad_norm=2.111
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2381/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2382/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2383/500000]
+ train/ActionNoiseL2Loss=0.1731
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2384/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2385/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2386/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2387/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2388/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2389/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2390/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2391/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2392/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2393/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2394/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2395/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2396/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2397/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2398/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2399/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2400/500000]
+ optim/total_grad_norm=2.639
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2401/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2402/500000]
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2403/500000]
+ train/ActionNoiseL2Loss=0.1678
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2404/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2405/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2406/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2407/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2408/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2409/500000]
+ train/ActionNoiseL2Loss=0.1483
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2410/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2411/500000]
+ train/ActionNoiseL2Loss=0.2052
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2412/500000]
+ train/ActionNoiseL2Loss=0.1536
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2413/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2414/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2415/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2416/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2417/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2418/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2419/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2420/500000]
+ optim/total_grad_norm=2.308
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2421/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2422/500000]
+ train/ActionNoiseL2Loss=0.1904
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2423/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2424/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2425/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2426/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2427/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2428/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2429/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2430/500000]
+ train/ActionNoiseL2Loss=0.2406
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2431/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2432/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2433/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2434/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2435/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2436/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2437/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2438/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2439/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2440/500000]
+ optim/total_grad_norm=2.293
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2441/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2442/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2443/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2444/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2445/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2446/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2447/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2448/500000]
+ train/ActionNoiseL2Loss=0.1454
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2449/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2450/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2451/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2452/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2453/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2454/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2455/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2456/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2457/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2458/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2459/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2460/500000]
+ optim/total_grad_norm=2.443
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2461/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2462/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2463/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2464/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2465/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2466/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2467/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2468/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2469/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2470/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2471/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2472/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2473/500000]
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2474/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2475/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2476/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2477/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2478/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2479/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2480/500000]
+ optim/total_grad_norm=1.411
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2481/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2482/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2483/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2484/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2485/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2486/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2487/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2488/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2489/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2490/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2491/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2492/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2493/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2494/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2495/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2496/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2497/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2498/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2499/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2500/500000]
+ optim/total_grad_norm=2.547
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/03 [07:29:13] INFO | >> Saving config... checkpoint.py:608
+10/03 [07:29:46] INFO | >> Saving model state... checkpoint.py:796
+10/03 [07:31:00] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [07:32:33] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=2502/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2503/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2504/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2505/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2506/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2507/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2508/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2509/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2510/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2511/500000]
+ train/ActionNoiseL2Loss=0.1608
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2512/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2513/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2514/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2515/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2516/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2517/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2518/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2519/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2520/500000]
+ optim/total_grad_norm=3.307
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2521/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2522/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2523/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2524/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2525/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2526/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2527/500000]
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2528/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2529/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2530/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2531/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2532/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2533/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2534/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2535/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2536/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2537/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2538/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2539/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2540/500000]
+ optim/total_grad_norm=2.424
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2541/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2542/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2543/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2544/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2545/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2546/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2547/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2548/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2549/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2550/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2551/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2552/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2553/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2554/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2555/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2556/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2557/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2558/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2559/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2560/500000]
+ optim/total_grad_norm=2.278
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2561/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2562/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2563/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2564/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2565/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2566/500000]
+ train/ActionNoiseL2Loss=0.2127
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2567/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2568/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2569/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2570/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2571/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2572/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2573/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2574/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2575/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2576/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2577/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2578/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2579/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2580/500000]
+ optim/total_grad_norm=2.101
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2581/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2582/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2583/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2584/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2585/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2586/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2587/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2588/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2589/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2590/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2591/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2592/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2593/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2594/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2595/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2596/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2597/500000]
+ train/ActionNoiseL2Loss=0.1862
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2598/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2599/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2600/500000]
+ optim/total_grad_norm=2.448
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2601/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2602/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2603/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2604/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2605/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2606/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2607/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2608/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2609/500000]
+ train/ActionNoiseL2Loss=0.2007
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2610/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2611/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2612/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2613/500000]
+ train/ActionNoiseL2Loss=0.1505
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2614/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2615/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2616/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2617/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2618/500000]
+ train/ActionNoiseL2Loss=0.1826
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2619/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2620/500000]
+ optim/total_grad_norm=1.837
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2621/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2622/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2623/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2624/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2625/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2626/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2627/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2628/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2629/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2630/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2631/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2632/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2633/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2634/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2635/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2636/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2637/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2638/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2639/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2640/500000]
+ optim/total_grad_norm=2.116
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2641/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2642/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2643/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2644/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2645/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2646/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2647/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2648/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2649/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2650/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2651/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2652/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2653/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2654/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2655/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2656/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2657/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2658/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2659/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2660/500000]
+ optim/total_grad_norm=2.526
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2661/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2662/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2663/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2664/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2665/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2666/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2667/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2668/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2669/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2670/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2671/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2672/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2673/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2674/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2675/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2676/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2677/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2678/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2679/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2680/500000]
+ optim/total_grad_norm=1.849
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2681/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2682/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2683/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2684/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2685/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2686/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2687/500000]
+ train/ActionNoiseL2Loss=0.2007
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2688/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2689/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2690/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2691/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2692/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2693/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2694/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2695/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2696/500000]
+ train/ActionNoiseL2Loss=0.1940
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2697/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2698/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2699/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2700/500000]
+ optim/total_grad_norm=2.418
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2701/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2702/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2703/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2704/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2705/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2706/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2707/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2708/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2709/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2710/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2711/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2712/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2713/500000]
+ train/ActionNoiseL2Loss=0.2370
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2714/500000]
+ train/ActionNoiseL2Loss=0.1939
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2715/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2716/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2717/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2718/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2719/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2720/500000]
+ optim/total_grad_norm=2.924
+ train/ActionNoiseL2Loss=0.1939
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2721/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2722/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2723/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2724/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2725/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2726/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2727/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2728/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2729/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2730/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2731/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2732/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2733/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2734/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2735/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2736/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2737/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2738/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2739/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2740/500000]
+ optim/total_grad_norm=1.963
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2741/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2742/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2743/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2744/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2745/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2746/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2747/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2748/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2749/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2750/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2751/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2752/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2753/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2754/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2755/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2756/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2757/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2758/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2759/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2760/500000]
+ optim/total_grad_norm=3.128
+ train/ActionNoiseL2Loss=0.1724
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2761/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2762/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2763/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2764/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2765/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2766/500000]
+ train/ActionNoiseL2Loss=0.1644
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2767/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2768/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2769/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2770/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2771/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2772/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2773/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2774/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2775/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2776/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2777/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2778/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2779/500000]
+ train/ActionNoiseL2Loss=0.1654
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2780/500000]
+ optim/total_grad_norm=1.848
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2781/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2782/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2783/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2784/500000]
+ train/ActionNoiseL2Loss=0.1603
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2785/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2786/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2787/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2788/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2789/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2790/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2791/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2792/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2793/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2794/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2795/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2796/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2797/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2798/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2799/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2800/500000]
+ optim/total_grad_norm=2.579
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2801/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2802/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2803/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2804/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2805/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2806/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2807/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2808/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2809/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2810/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2811/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2812/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2813/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2814/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2815/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2816/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2817/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2818/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2819/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2820/500000]
+ optim/total_grad_norm=2.116
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2821/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2822/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2823/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2824/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2825/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2826/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2827/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2828/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2829/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2830/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2831/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2832/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2833/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2834/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2835/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2836/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2837/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2838/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2839/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2840/500000]
+ optim/total_grad_norm=2.072
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2841/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2842/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2843/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2844/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2845/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2846/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2847/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2848/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2849/500000]
+ train/ActionNoiseL2Loss=0.1566
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2850/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2851/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2852/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2853/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2854/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2855/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2856/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2857/500000]
+ train/ActionNoiseL2Loss=0.1431
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2858/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2859/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2860/500000]
+ optim/total_grad_norm=2.336
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=2861/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2862/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2863/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2864/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2865/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2866/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2867/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2868/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2869/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2870/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2871/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2872/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2873/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2874/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2875/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2876/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2877/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2878/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2879/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2880/500000]
+ optim/total_grad_norm=1.728
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2881/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2882/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2883/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2884/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2885/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2886/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2887/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2888/500000]
+ train/ActionNoiseL2Loss=0.2315
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2889/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2890/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2891/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2892/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2893/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2894/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2895/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2896/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2897/500000]
+ train/ActionNoiseL2Loss=0.1643
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2898/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2899/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2900/500000]
+ optim/total_grad_norm=1.585
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2901/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2902/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2903/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2904/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2905/500000]
+ train/ActionNoiseL2Loss=0.2152
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2906/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2907/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2908/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2909/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2910/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2911/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2912/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2913/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2914/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2915/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2916/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2917/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2918/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2919/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2920/500000]
+ optim/total_grad_norm=1.403
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2921/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=2922/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2923/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2924/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2925/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2926/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2927/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2928/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2929/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2930/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2931/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2932/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2933/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2934/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2935/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2936/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2937/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2938/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2939/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=2940/500000]
+ optim/total_grad_norm=2.703
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=2941/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=2942/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=2943/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=2944/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=2945/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=2946/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=2947/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=2948/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2949/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2950/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2951/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2952/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2953/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2954/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2955/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2956/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2957/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2958/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2959/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2960/500000]
+ optim/total_grad_norm=2.555
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2961/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2962/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2963/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2964/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2965/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2966/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2967/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2968/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2969/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2970/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2971/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2972/500000]
+ train/ActionNoiseL2Loss=0.1832
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2973/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2974/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2975/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2976/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2977/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2978/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2979/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2980/500000]
+ optim/total_grad_norm=1.982
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2981/500000]
+ train/ActionNoiseL2Loss=0.1686
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2982/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2983/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2984/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2985/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2986/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2987/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2988/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2989/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2990/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=2991/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2992/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2993/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2994/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2995/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2996/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2997/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2998/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2999/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3000/500000]
+ optim/total_grad_norm=1.888
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/03 [10:26:04] INFO | >> Saving config... checkpoint.py:608
+10/03 [10:26:48] INFO | >> Saving model state... checkpoint.py:796
+10/03 [10:28:03] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [10:29:28] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3002/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3003/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=3004/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3005/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3006/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3007/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3008/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3009/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3010/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3011/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3012/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3013/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3014/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3015/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3016/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3017/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3018/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3019/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3020/500000]
+ optim/total_grad_norm=2.887
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3021/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3022/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3023/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3024/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3025/500000]
+ train/ActionNoiseL2Loss=0.1458
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3026/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3027/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3028/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3029/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3030/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3031/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3032/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3033/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3034/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3035/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3036/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3037/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3038/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3039/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3040/500000]
+ optim/total_grad_norm=2.172
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3041/500000]
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3042/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3043/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3044/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3045/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3046/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3047/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3048/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3049/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3050/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3051/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3052/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3053/500000]
+ train/ActionNoiseL2Loss=0.1431
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3054/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3055/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3056/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3057/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3058/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3059/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3060/500000]
+ optim/total_grad_norm=1.806
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3061/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3062/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3063/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3064/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3065/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3066/500000]
+ train/ActionNoiseL2Loss=0.1626
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3067/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3068/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3069/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3070/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3071/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3072/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3073/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3074/500000]
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3075/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3076/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3077/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3078/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3079/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3080/500000]
+ optim/total_grad_norm=1.885
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3081/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3082/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3083/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3084/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3085/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3086/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3087/500000]
+ train/ActionNoiseL2Loss=0.1973
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3088/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3089/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3090/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3091/500000]
+ train/ActionNoiseL2Loss=0.1670
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3092/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3093/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3094/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3095/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3096/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3097/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3098/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3099/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3100/500000]
+ optim/total_grad_norm=2.380
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3101/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3102/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3103/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3104/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3105/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3106/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3107/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3108/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3109/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3110/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3111/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3112/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3113/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3114/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3115/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3116/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3117/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3118/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3119/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3120/500000]
+ optim/total_grad_norm=2.193
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3121/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3122/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3123/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3124/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3125/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3126/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3127/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3128/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3129/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3130/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3131/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3132/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3133/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3134/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3135/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3136/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3137/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3138/500000]
+ train/ActionNoiseL2Loss=0.1696
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3139/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3140/500000]
+ optim/total_grad_norm=1.778
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3141/500000]
+ train/ActionNoiseL2Loss=0.1435
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3142/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3143/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3144/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3145/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3146/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3147/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3148/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3149/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3150/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3151/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3152/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3153/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3154/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3155/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3156/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3157/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3158/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3159/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3160/500000]
+ optim/total_grad_norm=2.030
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3161/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3162/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3163/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3164/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3165/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3166/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3167/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3168/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3169/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3170/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3171/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3172/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3173/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3174/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3175/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3176/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3177/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3178/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3179/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3180/500000]
+ optim/total_grad_norm=1.999
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3181/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3182/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3183/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3184/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3185/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3186/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3187/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3188/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3189/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3190/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3191/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3192/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3193/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3194/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3195/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3196/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3197/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3198/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3199/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3200/500000]
+ optim/total_grad_norm=1.533
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3201/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3202/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3203/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3204/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3205/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3206/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3207/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3208/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3209/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3210/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3211/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3212/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3213/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3214/500000]
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3215/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3216/500000]
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3217/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3218/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3219/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3220/500000]
+ optim/total_grad_norm=1.210
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3221/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3222/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3223/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3224/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3225/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3226/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3227/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3228/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3229/500000]
+ train/ActionNoiseL2Loss=0.1400
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3230/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3231/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3232/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3233/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3234/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3235/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3236/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3237/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3238/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3239/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3240/500000]
+ optim/total_grad_norm=1.944
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3241/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3242/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3243/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3244/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3245/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3246/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3247/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3248/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3249/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3250/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3251/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3252/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3253/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3254/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3255/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3256/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3257/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3258/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3259/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3260/500000]
+ optim/total_grad_norm=1.421
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3261/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3262/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3263/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3264/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3265/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3266/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3267/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3268/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3269/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3270/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3271/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3272/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3273/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3274/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3275/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3276/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3277/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3278/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3279/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3280/500000]
+ optim/total_grad_norm=2.410
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3281/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3282/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3283/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3284/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3285/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3286/500000]
+ train/ActionNoiseL2Loss=0.2398
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3287/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3288/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3289/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3290/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3291/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3292/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3293/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3294/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3295/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3296/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3297/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3298/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3299/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3300/500000]
+ optim/total_grad_norm=2.039
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3301/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3302/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3303/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3304/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3305/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3306/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3307/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3308/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3309/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3310/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3311/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3312/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3313/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3314/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3315/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3316/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3317/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3318/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3319/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3320/500000]
+ optim/total_grad_norm=2.141
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3321/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3322/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3323/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3324/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3325/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3326/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3327/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3328/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3329/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3330/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3331/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3332/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3333/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3334/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3335/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3336/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3337/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3338/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3339/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3340/500000]
+ optim/total_grad_norm=2.466
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3341/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3342/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3343/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3344/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3345/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3346/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3347/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3348/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=3349/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=3350/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=3351/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3352/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3353/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3354/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3355/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3356/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3357/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3358/500000]
+ train/ActionNoiseL2Loss=0.2062
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3359/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3360/500000]
+ optim/total_grad_norm=1.627
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3361/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3362/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3363/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3364/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3365/500000]
+ train/ActionNoiseL2Loss=0.1928
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3366/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3367/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3368/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3369/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3370/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3371/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3372/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3373/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3374/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3375/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3376/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3377/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3378/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3379/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3380/500000]
+ optim/total_grad_norm=2.269
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3381/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3382/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3383/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3384/500000]
+ train/ActionNoiseL2Loss=0.1490
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3385/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3386/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3387/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3388/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3389/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3390/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3391/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3392/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3393/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3394/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3395/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3396/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3397/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3398/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3399/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3400/500000]
+ optim/total_grad_norm=1.654
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3401/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3402/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3403/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3404/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3405/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3406/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3407/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3408/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3409/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3410/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3411/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3412/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3413/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3414/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3415/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3416/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3417/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3418/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3419/500000]
+ train/ActionNoiseL2Loss=0.2083
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3420/500000]
+ optim/total_grad_norm=1.546
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3421/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3422/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3423/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3424/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3425/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3426/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3427/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3428/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3429/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3430/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3431/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3432/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3433/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3434/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3435/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3436/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3437/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3438/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3439/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3440/500000]
+ optim/total_grad_norm=2.102
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3441/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3442/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3443/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3444/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3445/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3446/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3447/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3448/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3449/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3450/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3451/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3452/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3453/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3454/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3455/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3456/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3457/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3458/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3459/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3460/500000]
+ optim/total_grad_norm=2.668
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3461/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3462/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3463/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3464/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3465/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3466/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3467/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3468/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3469/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3470/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3471/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3472/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3473/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3474/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3475/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3476/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3477/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3478/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3479/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3480/500000]
+ optim/total_grad_norm=1.802
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3481/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3482/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3483/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3484/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3485/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3486/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3487/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3488/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3489/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3490/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3491/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3492/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3493/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3494/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3495/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3496/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3497/500000]
+ train/ActionNoiseL2Loss=0.1900
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3498/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3499/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3500/500000]
+ optim/total_grad_norm=1.996
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/03 [13:23:05] INFO | >> Saving config... checkpoint.py:608
+10/03 [13:23:49] INFO | >> Saving model state... checkpoint.py:796
+10/03 [13:25:03] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [13:26:28] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=3502/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=3503/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=3504/500000]
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3505/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3506/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3507/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3508/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3509/500000]
+ train/ActionNoiseL2Loss=0.1575
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3510/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3511/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3512/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3513/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3514/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3515/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3516/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3517/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3518/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3519/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3520/500000]
+ optim/total_grad_norm=2.453
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3521/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3522/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3523/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3524/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3525/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3526/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3527/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3528/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3529/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3530/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3531/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3532/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3533/500000]
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3534/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3535/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3536/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3537/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3538/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3539/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3540/500000]
+ optim/total_grad_norm=1.649
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3541/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3542/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3543/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3544/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3545/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3546/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3547/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3548/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3549/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3550/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3551/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3552/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3553/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3554/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3555/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3556/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3557/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3558/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3559/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3560/500000]
+ optim/total_grad_norm=1.867
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3561/500000]
+ train/ActionNoiseL2Loss=0.1608
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3562/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3563/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3564/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3565/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3566/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3567/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3568/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3569/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3570/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3571/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3572/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3573/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3574/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3575/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3576/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3577/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3578/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3579/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3580/500000]
+ optim/total_grad_norm=1.278
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3581/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3582/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3583/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3584/500000]
+ train/ActionNoiseL2Loss=0.1614
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3585/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3586/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3587/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3588/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3589/500000]
+ train/ActionNoiseL2Loss=0.2241
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3590/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3591/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3592/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3593/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3594/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3595/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3596/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3597/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3598/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3599/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3600/500000]
+ optim/total_grad_norm=2.287
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3601/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3602/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3603/500000]
+ train/ActionNoiseL2Loss=0.1746
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3604/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3605/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3606/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3607/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3608/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3609/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3610/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3611/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3612/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3613/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3614/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3615/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3616/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3617/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3618/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3619/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3620/500000]
+ optim/total_grad_norm=1.977
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3621/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3622/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3623/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3624/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3625/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3626/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3627/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3628/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3629/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3630/500000]
+ train/ActionNoiseL2Loss=0.1947
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3631/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3632/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3633/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3634/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3635/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3636/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3637/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3638/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3639/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3640/500000]
+ optim/total_grad_norm=2.405
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3641/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3642/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3643/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3644/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3645/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3646/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3647/500000]
+ train/ActionNoiseL2Loss=0.2578
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3648/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3649/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3650/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3651/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3652/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3653/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3654/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3655/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3656/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3657/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3658/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3659/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3660/500000]
+ optim/total_grad_norm=1.550
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3661/500000]
+ train/ActionNoiseL2Loss=0.1454
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3662/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3663/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3664/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3665/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3666/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3667/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3668/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3669/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3670/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3671/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3672/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3673/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3674/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3675/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3676/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3677/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3678/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3679/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3680/500000]
+ optim/total_grad_norm=2.427
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3681/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3682/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3683/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3684/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3685/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3686/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3687/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3688/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3689/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3690/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3691/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3692/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3693/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3694/500000]
+ train/ActionNoiseL2Loss=0.1934
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3695/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3696/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3697/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3698/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3699/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3700/500000]
+ optim/total_grad_norm=1.380
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3701/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3702/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3703/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3704/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3705/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3706/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3707/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3708/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3709/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3710/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=46,467
+[step=3711/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3712/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3713/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3714/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3715/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3716/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3717/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3718/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3719/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3720/500000]
+ optim/total_grad_norm=2.256
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3721/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3722/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3723/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3724/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3725/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3726/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3727/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3728/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3729/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3730/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3731/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3732/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3733/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3734/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3735/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3736/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3737/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3738/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3739/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3740/500000]
+ optim/total_grad_norm=1.353
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3741/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3742/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3743/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3744/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3745/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3746/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3747/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3748/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3749/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3750/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3751/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3752/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3753/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3754/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3755/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3756/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3757/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3758/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3759/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3760/500000]
+ optim/total_grad_norm=1.772
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3761/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3762/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3763/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3764/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3765/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3766/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3767/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3768/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3769/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3770/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3771/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3772/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3773/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3774/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3775/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3776/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3777/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3778/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3779/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3780/500000]
+ optim/total_grad_norm=2.220
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3781/500000]
+ train/ActionNoiseL2Loss=0.2008
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3782/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3783/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3784/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3785/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3786/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3787/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3788/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3789/500000]
+ train/ActionNoiseL2Loss=0.1569
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3790/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3791/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3792/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3793/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3794/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3795/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3796/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3797/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3798/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3799/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3800/500000]
+ optim/total_grad_norm=1.805
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3801/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3802/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3803/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3804/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3805/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3806/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3807/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3808/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3809/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3810/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3811/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3812/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3813/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3814/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3815/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3816/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3817/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3818/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3819/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3820/500000]
+ optim/total_grad_norm=2.173
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3821/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3822/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3823/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3824/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3825/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3826/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3827/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3828/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3829/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3830/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3831/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3832/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3833/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3834/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3835/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3836/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3837/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3838/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3839/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3840/500000]
+ optim/total_grad_norm=1.343
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3841/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3842/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3843/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3844/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3845/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3846/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3847/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3848/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3849/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3850/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3851/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3852/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3853/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3854/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3855/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3856/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3857/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3858/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3859/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3860/500000]
+ optim/total_grad_norm=2.077
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3861/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3862/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3863/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3864/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3865/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3866/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3867/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3868/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3869/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3870/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3871/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3872/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3873/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3874/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3875/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3876/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3877/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3878/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3879/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3880/500000]
+ optim/total_grad_norm=1.841
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3881/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3882/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3883/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3884/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3885/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3886/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3887/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=3888/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3889/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3890/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3891/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3892/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=3893/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3894/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3895/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3896/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3897/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3898/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3899/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3900/500000]
+ optim/total_grad_norm=1.355
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3901/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3902/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3903/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3904/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3905/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3906/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3907/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3908/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3909/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3910/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=3911/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3912/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3913/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3914/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3915/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3916/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3917/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3918/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3919/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3920/500000]
+ optim/total_grad_norm=1.666
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3921/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3922/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3923/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3924/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3925/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3926/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3927/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3928/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3929/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3930/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3931/500000]
+ train/ActionNoiseL2Loss=0.1554
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3932/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3933/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3934/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3935/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3936/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3937/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3938/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3939/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3940/500000]
+ optim/total_grad_norm=1.531
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3941/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3942/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3943/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3944/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3945/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3946/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3947/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3948/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3949/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3950/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3951/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3952/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3953/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3954/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3955/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3956/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3957/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3958/500000]
+ train/ActionNoiseL2Loss=0.1400
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3959/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3960/500000]
+ optim/total_grad_norm=1.465
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3961/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3962/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3963/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3964/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3965/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3966/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3967/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3968/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3969/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3970/500000]
+ train/ActionNoiseL2Loss=0.1832
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3971/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3972/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3973/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3974/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3975/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3976/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3977/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3978/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3979/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3980/500000]
+ optim/total_grad_norm=2.147
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3981/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3982/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3983/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3984/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3985/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3986/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3987/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3988/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3989/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3990/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=3991/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3992/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3993/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3994/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3995/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3996/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3997/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3998/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=3999/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4000/500000]
+ optim/total_grad_norm=2.383
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/03 [16:20:00] INFO | >> Saving config... checkpoint.py:608
+10/03 [16:20:49] INFO | >> Saving model state... checkpoint.py:796
+10/03 [16:22:03] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [16:23:29] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0497
+[step=4002/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=4003/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=4004/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4005/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4006/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4007/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4008/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4009/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4010/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4011/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4012/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4013/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4014/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4015/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4016/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4017/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4018/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4019/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4020/500000]
+ optim/total_grad_norm=1.393
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4021/500000]
+ train/ActionNoiseL2Loss=0.1931
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4022/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4023/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4024/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4025/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4026/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4027/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4028/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4029/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4030/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4031/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4032/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4033/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4034/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4035/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4036/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4037/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4038/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4039/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4040/500000]
+ optim/total_grad_norm=2.075
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4041/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4042/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4043/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4044/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4045/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4046/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4047/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4048/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4049/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4050/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4051/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4052/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4053/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4054/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4055/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4056/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4057/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4058/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4059/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4060/500000]
+ optim/total_grad_norm=1.566
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4061/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4062/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4063/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4064/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4065/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4066/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4067/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4068/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4069/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4070/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4071/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4072/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4073/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4074/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4075/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4076/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4077/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4078/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4079/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4080/500000]
+ optim/total_grad_norm=1.853
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4081/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4082/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4083/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4084/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4085/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4086/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4087/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4088/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4089/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4090/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4091/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4092/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4093/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4094/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4095/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4096/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4097/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4098/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4099/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4100/500000]
+ optim/total_grad_norm=1.208
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4101/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4102/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4103/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4104/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4105/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4106/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4107/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4108/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4109/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4110/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4111/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4112/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4113/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4114/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4115/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4116/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4117/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4118/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4119/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4120/500000]
+ optim/total_grad_norm=2.657
+ train/ActionNoiseL2Loss=0.2157
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4121/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4122/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4123/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4124/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4125/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4126/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4127/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4128/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4129/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4130/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4131/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4132/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4133/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4134/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4135/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4136/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4137/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4138/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4139/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4140/500000]
+ optim/total_grad_norm=1.473
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4141/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4142/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4143/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4144/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4145/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4146/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4147/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4148/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4149/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4150/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4151/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4152/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4153/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4154/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4155/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4156/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4157/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4158/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4159/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4160/500000]
+ optim/total_grad_norm=1.719
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4161/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4162/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4163/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4164/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4165/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4166/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4167/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4168/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4169/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4170/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4171/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4172/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4173/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4174/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4175/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4176/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4177/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4178/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4179/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4180/500000]
+ optim/total_grad_norm=1.336
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4181/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4182/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4183/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4184/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4185/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4186/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4187/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4188/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4189/500000]
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4190/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4191/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4192/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4193/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4194/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4195/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4196/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4197/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4198/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4199/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4200/500000]
+ optim/total_grad_norm=1.603
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4201/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4202/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4203/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4204/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4205/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4206/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4207/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4208/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4209/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4210/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4211/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4212/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4213/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4214/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4215/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4216/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4217/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4218/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4219/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4220/500000]
+ optim/total_grad_norm=1.660
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4221/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4222/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4223/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4224/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4225/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4226/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4227/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4228/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4229/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4230/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4231/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4232/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4233/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4234/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4235/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4236/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4237/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4238/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4239/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4240/500000]
+ optim/total_grad_norm=2.298
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4241/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4242/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4243/500000]
+ train/ActionNoiseL2Loss=0.2242
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4244/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4245/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4246/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4247/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4248/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4249/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4250/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4251/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4252/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4253/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4254/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4255/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4256/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4257/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4258/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4259/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4260/500000]
+ optim/total_grad_norm=1.982
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4261/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4262/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4263/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4264/500000]
+ train/ActionNoiseL2Loss=0.1909
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4265/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4266/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4267/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4268/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4269/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4270/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4271/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4272/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4273/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4274/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4275/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4276/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4277/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4278/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4279/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4280/500000]
+ optim/total_grad_norm=2.257
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4281/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4282/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4283/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4284/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4285/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4286/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4287/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4288/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4289/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4290/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4291/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4292/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4293/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4294/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4295/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4296/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4297/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4298/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4299/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4300/500000]
+ optim/total_grad_norm=2.028
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4301/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4302/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4303/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4304/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4305/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4306/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4307/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4308/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4309/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4310/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4311/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4312/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4313/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4314/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4315/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4316/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4317/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4318/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4319/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4320/500000]
+ optim/total_grad_norm=1.746
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4321/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4322/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4323/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4324/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4325/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4326/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4327/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4328/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4329/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4330/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4331/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4332/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4333/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4334/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4335/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4336/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4337/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4338/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4339/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4340/500000]
+ optim/total_grad_norm=1.925
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4341/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4342/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4343/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4344/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4345/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4346/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4347/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4348/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4349/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4350/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4351/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4352/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4353/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4354/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4355/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4356/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4357/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4358/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4359/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4360/500000]
+ optim/total_grad_norm=1.670
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4361/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4362/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4363/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4364/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4365/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4366/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4367/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4368/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4369/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4370/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4371/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4372/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4373/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4374/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4375/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4376/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4377/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4378/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4379/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4380/500000]
+ optim/total_grad_norm=1.478
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4381/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4382/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4383/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4384/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4385/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4386/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4387/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4388/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4389/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4390/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4391/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4392/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4393/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4394/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4395/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4396/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4397/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4398/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4399/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4400/500000]
+ optim/total_grad_norm=2.143
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4401/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4402/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4403/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4404/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4405/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4406/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4407/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4408/500000]
+ train/ActionNoiseL2Loss=0.1505
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4409/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4410/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4411/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4412/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4413/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4414/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4415/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4416/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4417/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4418/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4419/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4420/500000]
+ optim/total_grad_norm=1.514
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4421/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4422/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4423/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4424/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4425/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4426/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4427/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4428/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4429/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4430/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4431/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4432/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4433/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4434/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4435/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4436/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4437/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4438/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4439/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4440/500000]
+ optim/total_grad_norm=1.861
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4441/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4442/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4443/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4444/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4445/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4446/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4447/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4448/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4449/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4450/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4451/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4452/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4453/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4454/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4455/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4456/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4457/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4458/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4459/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4460/500000]
+ optim/total_grad_norm=1.244
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4461/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4462/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4463/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4464/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4465/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4466/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4467/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4468/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4469/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4470/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4471/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4472/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4473/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4474/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4475/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4476/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4477/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4478/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4479/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4480/500000]
+ optim/total_grad_norm=1.447
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4481/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4482/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4483/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4484/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4485/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4486/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4487/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4488/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4489/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4490/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4491/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=4492/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=4493/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=4494/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=4495/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=4496/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=4497/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=4498/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=4499/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=4500/500000]
+ optim/total_grad_norm=1.787
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+10/03 [19:17:20] INFO | >> Saving config... checkpoint.py:608
+10/03 [19:17:53] INFO | >> Saving model state... checkpoint.py:796
+10/03 [19:19:04] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [19:20:36] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=4502/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=4503/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=4504/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=4505/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=4506/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=4507/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4508/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4509/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4510/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4511/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4512/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4513/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4514/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4515/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4516/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4517/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4518/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4519/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4520/500000]
+ optim/total_grad_norm=1.375
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4521/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4522/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4523/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4524/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4525/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4526/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4527/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4528/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4529/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4530/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4531/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4532/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4533/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4534/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4535/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4536/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4537/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4538/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4539/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4540/500000]
+ optim/total_grad_norm=1.985
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4541/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4542/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4543/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4544/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4545/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4546/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4547/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4548/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4549/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4550/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4551/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4552/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4553/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4554/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4555/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4556/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4557/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4558/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4559/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4560/500000]
+ optim/total_grad_norm=1.438
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4561/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4562/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4563/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4564/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4565/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4566/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4567/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4568/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4569/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4570/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4571/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4572/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4573/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4574/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4575/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4576/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4577/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4578/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4579/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4580/500000]
+ optim/total_grad_norm=1.034
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4581/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4582/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4583/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4584/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4585/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4586/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4587/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4588/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4589/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4590/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4591/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4592/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4593/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4594/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4595/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4596/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4597/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4598/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4599/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4600/500000]
+ optim/total_grad_norm=1.679
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4601/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4602/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4603/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4604/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4605/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4606/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4607/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4608/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4609/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4610/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4611/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4612/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4613/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4614/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4615/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4616/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4617/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4618/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4619/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4620/500000]
+ optim/total_grad_norm=1.245
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4621/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4622/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4623/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4624/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4625/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4626/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4627/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4628/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4629/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4630/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4631/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4632/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4633/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4634/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4635/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4636/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4637/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4638/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4639/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4640/500000]
+ optim/total_grad_norm=1.994
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4641/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4642/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4643/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4644/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4645/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4646/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4647/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4648/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4649/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4650/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4651/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4652/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4653/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4654/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4655/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4656/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4657/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4658/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4659/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4660/500000]
+ optim/total_grad_norm=2.451
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4661/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4662/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4663/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4664/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4665/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4666/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4667/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4668/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4669/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4670/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4671/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4672/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4673/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4674/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4675/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4676/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4677/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4678/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4679/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4680/500000]
+ optim/total_grad_norm=1.369
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4681/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4682/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4683/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4684/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4685/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4686/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4687/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4688/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4689/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4690/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4691/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4692/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4693/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4694/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4695/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4696/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4697/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4698/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4699/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4700/500000]
+ optim/total_grad_norm=1.705
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4701/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4702/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4703/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4704/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4705/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4706/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4707/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4708/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4709/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4710/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4711/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4712/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4713/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4714/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4715/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4716/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4717/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4718/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4719/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4720/500000]
+ optim/total_grad_norm=2.278
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4721/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4722/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4723/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4724/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4725/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4726/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4727/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4728/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4729/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4730/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4731/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4732/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4733/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4734/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4735/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4736/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4737/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4738/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4739/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4740/500000]
+ optim/total_grad_norm=1.834
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4741/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4742/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4743/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4744/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4745/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4746/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4747/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4748/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4749/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4750/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4751/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4752/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4753/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4754/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4755/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4756/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4757/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4758/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4759/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4760/500000]
+ optim/total_grad_norm=1.801
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4761/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4762/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4763/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4764/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4765/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4766/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4767/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4768/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4769/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4770/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4771/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4772/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4773/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4774/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4775/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4776/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4777/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4778/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4779/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4780/500000]
+ optim/total_grad_norm=2.511
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4781/500000]
+ train/ActionNoiseL2Loss=0.1490
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4782/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4783/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4784/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4785/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4786/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4787/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4788/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4789/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4790/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4791/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4792/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4793/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4794/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4795/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4796/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4797/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4798/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4799/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4800/500000]
+ optim/total_grad_norm=1.738
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4801/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4802/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4803/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4804/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4805/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4806/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4807/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4808/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4809/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4810/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4811/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4812/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4813/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4814/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4815/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4816/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4817/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4818/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4819/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4820/500000]
+ optim/total_grad_norm=1.593
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4821/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4822/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4823/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4824/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4825/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4826/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4827/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4828/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4829/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4830/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4831/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4832/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4833/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4834/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4835/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4836/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4837/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4838/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4839/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4840/500000]
+ optim/total_grad_norm=1.439
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4841/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4842/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4843/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4844/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4845/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4846/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4847/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4848/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4849/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4850/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4851/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4852/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4853/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4854/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4855/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4856/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4857/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4858/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4859/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4860/500000]
+ optim/total_grad_norm=2.624
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4861/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4862/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4863/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4864/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4865/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4866/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4867/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4868/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4869/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=4870/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4871/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4872/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4873/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4874/500000]
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4875/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4876/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4877/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4878/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4879/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4880/500000]
+ optim/total_grad_norm=1.445
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4881/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=4882/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4883/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4884/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4885/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4886/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4887/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4888/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4889/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4890/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4891/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4892/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4893/500000]
+ train/ActionNoiseL2Loss=0.1553
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4894/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4895/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4896/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4897/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4898/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4899/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4900/500000]
+ optim/total_grad_norm=1.316
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4901/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4902/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4903/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4904/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4905/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4906/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4907/500000]
+ train/ActionNoiseL2Loss=0.1427
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4908/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4909/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4910/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4911/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4912/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4913/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4914/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4915/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4916/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4917/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4918/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4919/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4920/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4921/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4922/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4923/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4924/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4925/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4926/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4927/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4928/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4929/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4930/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4931/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4932/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4933/500000]
+ train/ActionNoiseL2Loss=0.1755
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4934/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4935/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4936/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4937/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4938/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4939/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4940/500000]
+ optim/total_grad_norm=1.506
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4941/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4942/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4943/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4944/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4945/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4946/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4947/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4948/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4949/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4950/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4951/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4952/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4953/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4954/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4955/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4956/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4957/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4958/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4959/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4960/500000]
+ optim/total_grad_norm=2.075
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4961/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4962/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4963/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4964/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4965/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4966/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4967/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4968/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4969/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4970/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=4971/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4972/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4973/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4974/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4975/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=955,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4976/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=955,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4977/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=955,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4978/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=955,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4979/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=955,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4980/500000]
+ optim/total_grad_norm=1.850
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=956,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4981/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=956,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4982/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=956,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4983/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=956,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4984/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=956,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4985/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=957,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4986/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=957,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4987/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=957,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4988/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=957,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4989/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=957,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4990/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=958,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=4991/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=958,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4992/500000]
+ train/ActionNoiseL2Loss=0.1363
+ throughput/total_tokens=958,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4993/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=958,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4994/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=958,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=4995/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=959,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4996/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=959,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4997/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=959,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4998/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=959,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4999/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=959,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5000/500000]
+ optim/total_grad_norm=2.112
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=960,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/03 [22:14:14] INFO | >> Saving config... checkpoint.py:608
+10/03 [22:15:06] INFO | >> Saving model state... checkpoint.py:796
+10/03 [22:16:15] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [22:17:50] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5001/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=960,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5002/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=960,384,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=5003/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=960,576,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=5004/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=960,768,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5005/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=960,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5006/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=961,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=5007/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=961,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5008/500000]
+ train/ActionNoiseL2Loss=0.2024
+ throughput/total_tokens=961,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5009/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=961,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5010/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=961,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5011/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=962,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5012/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=962,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5013/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=962,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5014/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=962,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5015/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=962,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5016/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=963,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5017/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=963,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5018/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=963,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5019/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=963,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5020/500000]
+ optim/total_grad_norm=1.373
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=963,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5021/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=964,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5022/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=964,224,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5023/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=964,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5024/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=964,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5025/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=964,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5026/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=964,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5027/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=965,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5028/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=965,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5029/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=965,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5030/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=965,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5031/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=965,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5032/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=966,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5033/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=966,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5034/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=966,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5035/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=966,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5036/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=966,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5037/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=967,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5038/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=967,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5039/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=967,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5040/500000]
+ optim/total_grad_norm=1.413
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=967,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5041/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=967,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5042/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=968,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5043/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=968,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5044/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=968,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5045/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=968,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5046/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=968,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5047/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=969,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5048/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=969,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5049/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=969,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5050/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=969,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5051/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=969,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5052/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=969,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5053/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=970,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5054/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=970,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5055/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=970,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5056/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=970,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5057/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=970,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5058/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=971,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5059/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=971,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5060/500000]
+ optim/total_grad_norm=1.536
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=971,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5061/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=971,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5062/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=971,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5063/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=972,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5064/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=972,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5065/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=972,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5066/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=972,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5067/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=972,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5068/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=973,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5069/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=973,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5070/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=973,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5071/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=973,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5072/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=973,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5073/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=974,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5074/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=974,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5075/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=974,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5076/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=974,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5077/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=974,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5078/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=974,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5079/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=975,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5080/500000]
+ optim/total_grad_norm=1.667
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=975,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5081/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=975,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5082/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=975,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5083/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=975,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5084/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=976,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5085/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=976,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5086/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=976,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5087/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=976,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5088/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=976,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5089/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=977,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5090/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=977,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5091/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=977,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5092/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=977,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5093/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=977,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5094/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=978,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5095/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=978,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5096/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=978,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5097/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=978,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5098/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=978,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5099/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=979,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5100/500000]
+ optim/total_grad_norm=1.566
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=979,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5101/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=979,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5102/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=979,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5103/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=979,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5104/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=979,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5105/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=980,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5106/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=980,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5107/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=980,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5108/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=980,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5109/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=980,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5110/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=981,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5111/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=981,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5112/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=981,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5113/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=981,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5114/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=981,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5115/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=982,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5116/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=982,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5117/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=982,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5118/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=982,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5119/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=982,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5120/500000]
+ optim/total_grad_norm=1.295
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=983,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5121/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=983,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5122/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=983,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5123/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=983,616,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5124/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=983,808,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5125/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=984,000,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5126/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=984,192,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5127/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=984,384,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5128/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=984,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5129/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=984,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5130/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=984,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5131/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=985,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5132/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=985,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5133/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=985,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5134/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=985,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5135/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=985,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5136/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=986,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5137/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=986,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5138/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=986,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5139/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=986,688,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5140/500000]
+ optim/total_grad_norm=2.293
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=986,880,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5141/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=987,072,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5142/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=987,264,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5143/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=987,456,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5144/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=987,648,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5145/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=987,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5146/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=988,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5147/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=988,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5148/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=988,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5149/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=988,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5150/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=988,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5151/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=988,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5152/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=989,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5153/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=989,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5154/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=989,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5155/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=989,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5156/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=989,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5157/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=990,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5158/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=990,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5159/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=990,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5160/500000]
+ optim/total_grad_norm=1.835
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=990,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5161/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=990,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5162/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=991,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5163/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=991,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5164/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=991,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5165/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=991,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5166/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=991,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5167/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=992,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5168/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=992,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5169/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=992,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5170/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=992,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5171/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=992,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5172/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=993,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5173/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=993,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5174/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=993,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5175/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=993,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5176/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=993,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5177/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=993,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5178/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=994,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5179/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=994,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5180/500000]
+ optim/total_grad_norm=1.254
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=994,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5181/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=994,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5182/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=994,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5183/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=995,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5184/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=995,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5185/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=995,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5186/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=995,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5187/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=995,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5188/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=996,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5189/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=996,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5190/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=996,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5191/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=996,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5192/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=996,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5193/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=997,056,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5194/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=997,248,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5195/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=997,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5196/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=997,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5197/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=997,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5198/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=998,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5199/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=998,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5200/500000]
+ optim/total_grad_norm=1.679
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=998,400,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5201/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=998,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5202/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=998,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5203/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=998,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5204/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=999,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5205/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=999,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5206/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=999,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5207/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=999,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5208/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=999,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5209/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,000,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5210/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,000,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5211/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,000,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5212/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,000,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5213/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=1,000,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5214/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=1,001,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5215/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,001,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5216/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,001,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5217/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=1,001,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5218/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,001,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5219/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=1,002,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5220/500000]
+ optim/total_grad_norm=1.422
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,002,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5221/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,002,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5222/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,002,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=5223/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=1,002,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5224/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=1,003,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5225/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,003,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5226/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,003,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5227/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,003,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5228/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,003,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5229/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,003,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5230/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,004,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5231/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,004,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5232/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,004,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5233/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,004,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5234/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,004,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5235/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=1,005,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5236/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,005,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5237/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,005,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5238/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=1,005,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5239/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,005,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5240/500000]
+ optim/total_grad_norm=1.026
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,006,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5241/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=1,006,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5242/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,006,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5243/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,006,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5244/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=1,006,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5245/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,007,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5246/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,007,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5247/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,007,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5248/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=1,007,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5249/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,007,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5250/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,008,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5251/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=1,008,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5252/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,008,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5253/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,008,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5254/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,008,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5255/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=1,008,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5256/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,009,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5257/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,009,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5258/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,009,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5259/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=1,009,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5260/500000]
+ optim/total_grad_norm=1.609
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,009,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5261/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,010,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5262/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,010,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5263/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=1,010,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5264/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,010,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5265/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,010,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5266/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,011,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5267/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,011,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5268/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,011,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5269/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,011,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5270/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=1,011,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5271/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,012,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5272/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,012,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5273/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,012,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5274/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,012,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5275/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,012,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5276/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,012,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5277/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=1,013,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5278/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=1,013,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5279/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,013,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5280/500000]
+ optim/total_grad_norm=1.695
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=1,013,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5281/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,013,952,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5282/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,014,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5283/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,014,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5284/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=1,014,528,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5285/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,014,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5286/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,014,912,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5287/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,015,104,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5288/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,015,296,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5289/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,015,488,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5290/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,015,680,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5291/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,015,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5292/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,016,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5293/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,016,256,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5294/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,016,448,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5295/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,016,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5296/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,016,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5297/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,017,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5298/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,017,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5299/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,017,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5300/500000]
+ optim/total_grad_norm=1.913
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=1,017,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5301/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,017,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5302/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=1,017,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5303/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,018,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5304/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,018,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5305/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,018,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5306/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,018,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5307/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,018,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5308/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,019,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5309/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,019,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5310/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=1,019,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5311/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,019,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5312/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,019,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5313/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,020,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5314/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,020,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5315/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,020,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5316/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,020,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5317/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,020,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5318/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,021,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5319/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,021,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5320/500000]
+ optim/total_grad_norm=1.500
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,021,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5321/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,021,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5322/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,021,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5323/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=1,022,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5324/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,022,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5325/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,022,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5326/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,022,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5327/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,022,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5328/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,022,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5329/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,023,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5330/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,023,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5331/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,023,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5332/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,023,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5333/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,023,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5334/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,024,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5335/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,024,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5336/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,024,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5337/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,024,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5338/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,024,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5339/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,025,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5340/500000]
+ optim/total_grad_norm=1.321
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,025,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5341/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,025,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5342/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,025,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=5343/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,025,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=5344/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,026,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5345/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,026,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5346/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=1,026,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5347/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,026,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5348/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,026,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5349/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,027,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5350/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,027,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5351/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=1,027,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5352/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,027,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5353/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=1,027,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5354/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,027,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5355/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,028,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5356/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=1,028,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5357/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,028,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5358/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,028,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5359/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,028,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5360/500000]
+ optim/total_grad_norm=1.730
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=1,029,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5361/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=1,029,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5362/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,029,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5363/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,029,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5364/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,029,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5365/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=1,030,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5366/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,030,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5367/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,030,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5368/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,030,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5369/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,030,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5370/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,031,040,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5371/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,031,232,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5372/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,031,424,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5373/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,031,616,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5374/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=1,031,808,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5375/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,032,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5376/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,032,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5377/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,032,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5378/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,032,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5379/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,032,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5380/500000]
+ optim/total_grad_norm=2.114
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,032,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5381/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,033,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5382/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,033,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5383/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,033,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5384/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,033,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5385/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,033,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5386/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,034,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5387/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,034,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5388/500000]
+ train/ActionNoiseL2Loss=0.1881
+ throughput/total_tokens=1,034,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5389/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=1,034,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5390/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,034,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5391/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=1,035,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5392/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,035,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5393/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,035,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5394/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,035,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5395/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,035,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5396/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,036,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5397/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,036,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5398/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,036,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5399/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,036,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5400/500000]
+ optim/total_grad_norm=1.438
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,036,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5401/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,036,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5402/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,037,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5403/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,037,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5404/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,037,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5405/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,037,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5406/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,037,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5407/500000]
+ train/ActionNoiseL2Loss=0.1577
+ throughput/total_tokens=1,038,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5408/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,038,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5409/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,038,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5410/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,038,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5411/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,038,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5412/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,039,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5413/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,039,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5414/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,039,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5415/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,039,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5416/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,039,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5417/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,040,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5418/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,040,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5419/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,040,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5420/500000]
+ optim/total_grad_norm=1.185
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,040,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5421/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,040,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5422/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,041,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5423/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=1,041,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5424/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,041,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5425/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,041,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5426/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,041,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5427/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,041,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5428/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,042,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5429/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,042,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5430/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,042,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5431/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,042,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5432/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,042,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5433/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,043,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5434/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,043,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5435/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,043,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5436/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,043,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5437/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,043,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5438/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,044,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5439/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,044,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5440/500000]
+ optim/total_grad_norm=1.951
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,044,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5441/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,044,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5442/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=1,044,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5443/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,045,056,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5444/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=1,045,248,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5445/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,045,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5446/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,045,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5447/500000]
+ train/ActionNoiseL2Loss=0.1709
+ throughput/total_tokens=1,045,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5448/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,046,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5449/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,046,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5450/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,046,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5451/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,046,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5452/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,046,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5453/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=1,046,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5454/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,047,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5455/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,047,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5456/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=1,047,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5457/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,047,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5458/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,047,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5459/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,048,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5460/500000]
+ optim/total_grad_norm=1.605
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,048,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5461/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,048,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5462/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,048,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5463/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,048,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5464/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,049,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5465/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,049,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5466/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,049,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5467/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,049,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5468/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,049,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5469/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,050,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5470/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,050,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5471/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,050,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5472/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,050,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5473/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,050,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5474/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,051,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5475/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,051,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5476/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,051,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5477/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,051,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5478/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,051,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5479/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,051,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5480/500000]
+ optim/total_grad_norm=1.459
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,052,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5481/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,052,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5482/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,052,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5483/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=1,052,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5484/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=1,052,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5485/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,053,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5486/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=1,053,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5487/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,053,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5488/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,053,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5489/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,053,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5490/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,054,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5491/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,054,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5492/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,054,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5493/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,054,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5494/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,054,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5495/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,055,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5496/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=1,055,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5497/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=1,055,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5498/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,055,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5499/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,055,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5500/500000]
+ optim/total_grad_norm=1.256
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,056,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [01:11:15] INFO | >> Saving config... checkpoint.py:608
+10/04 [01:12:00] INFO | >> Saving model state... checkpoint.py:796
+10/04 [01:13:15] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [01:14:48] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5501/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=1,056,192,000
+ throughput/device/tokens_per_second=1,197
+ throughput/device/batches_per_second=0.0499
+[step=5502/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,056,384,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=5503/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,056,576,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=5504/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,056,768,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=5505/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,056,960,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=5506/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,057,152,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=5507/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,057,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=5508/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,057,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=5509/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,057,728,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=5510/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,057,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5511/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,058,112,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5512/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,058,304,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5513/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,058,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5514/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,058,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5515/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=1,058,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5516/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,059,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5517/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,059,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5518/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=1,059,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5519/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,059,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5520/500000]
+ optim/total_grad_norm=1.585
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,059,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5521/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,060,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5522/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=1,060,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5523/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,060,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5524/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,060,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5525/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,060,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5526/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=1,060,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5527/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,061,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5528/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,061,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5529/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,061,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5530/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,061,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5531/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,061,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5532/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,062,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5533/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,062,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5534/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,062,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5535/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=1,062,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5536/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,062,912,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5537/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,063,104,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5538/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,063,296,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5539/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,063,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5540/500000]
+ optim/total_grad_norm=2.358
+ train/ActionNoiseL2Loss=0.1783
+ throughput/total_tokens=1,063,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5541/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,063,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5542/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=1,064,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5543/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,064,256,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5544/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,064,448,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5545/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,064,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5546/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=1,064,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5547/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,065,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5548/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,065,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5549/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,065,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5550/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,065,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5551/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,065,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5552/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,065,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5553/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,066,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5554/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,066,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5555/500000]
+ train/ActionNoiseL2Loss=0.1753
+ throughput/total_tokens=1,066,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5556/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,066,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5557/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,066,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5558/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,067,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5559/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,067,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5560/500000]
+ optim/total_grad_norm=2.424
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=1,067,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5561/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,067,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5562/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,067,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5563/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,068,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5564/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,068,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5565/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,068,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5566/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,068,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5567/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,068,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5568/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,069,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5569/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,069,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5570/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,069,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5571/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=1,069,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5572/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,069,824,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5573/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,070,016,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5574/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,070,208,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5575/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,070,400,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5576/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,070,592,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5577/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=1,070,784,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5578/500000]
+ train/ActionNoiseL2Loss=0.1528
+ throughput/total_tokens=1,070,976,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5579/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,071,168,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5580/500000]
+ optim/total_grad_norm=1.303
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,071,360,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5581/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,071,552,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5582/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,071,744,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5583/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,071,936,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5584/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,072,128,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5585/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,072,320,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5586/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,072,512,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5587/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,072,704,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5588/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,072,896,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5589/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,073,088,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5590/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,073,280,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5591/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,073,472,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5592/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,073,664,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5593/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=1,073,856,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5594/500000]
+ train/ActionNoiseL2Loss=0.1641
+ throughput/total_tokens=1,074,048,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5595/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=1,074,240,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5596/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,074,432,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5597/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,074,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5598/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,074,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5599/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,075,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5600/500000]
+ optim/total_grad_norm=1.487
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=1,075,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5601/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,075,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5602/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=1,075,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5603/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,075,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5604/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,075,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5605/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,076,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5606/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,076,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5607/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,076,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5608/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,076,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5609/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,076,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5610/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=1,077,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5611/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,077,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5612/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,077,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5613/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,077,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5614/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,077,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5615/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,078,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5616/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=1,078,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5617/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=1,078,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5618/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,078,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5619/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=1,078,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5620/500000]
+ optim/total_grad_norm=1.563
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,079,040,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5621/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,079,232,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5622/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,079,424,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5623/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,079,616,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5624/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,079,808,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5625/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,080,000,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5626/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,080,192,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5627/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=1,080,384,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5628/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,080,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5629/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,080,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5630/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,080,960,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5631/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,081,152,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5632/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,081,344,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5633/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,081,536,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5634/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,081,728,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5635/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=1,081,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5636/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,082,112,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5637/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,082,304,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5638/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,082,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5639/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,082,688,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5640/500000]
+ optim/total_grad_norm=1.495
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,082,880,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=5641/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,083,072,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5642/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,083,264,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5643/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,083,456,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5644/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,083,648,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5645/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,083,840,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5646/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=1,084,032,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5647/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,084,224,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5648/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,084,416,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=5649/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,084,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5650/500000]
+ train/ActionNoiseL2Loss=0.1363
+ throughput/total_tokens=1,084,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5651/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,084,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5652/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,085,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5653/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,085,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5654/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,085,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5655/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=1,085,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5656/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,085,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5657/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,086,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5658/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,086,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5659/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,086,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5660/500000]
+ optim/total_grad_norm=2.074
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=1,086,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5661/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,086,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5662/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,087,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5663/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,087,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5664/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,087,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5665/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=1,087,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5666/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,087,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5667/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,088,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5668/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,088,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5669/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,088,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5670/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,088,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5671/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,088,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5672/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,089,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5673/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,089,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5674/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=1,089,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5675/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,089,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5676/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=1,089,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5677/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,089,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5678/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,090,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5679/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=1,090,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5680/500000]
+ optim/total_grad_norm=1.948
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=1,090,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5681/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,090,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5682/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,090,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5683/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=1,091,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5684/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,091,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5685/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,091,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5686/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,091,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5687/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,091,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5688/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,092,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5689/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,092,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5690/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,092,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5691/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,092,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5692/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=1,092,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5693/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,093,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5694/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,093,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5695/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,093,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5696/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,093,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5697/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=1,093,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5698/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,094,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5699/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,094,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5700/500000]
+ optim/total_grad_norm=1.882
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,094,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5701/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,094,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5702/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,094,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5703/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=1,094,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5704/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,095,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5705/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,095,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5706/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=1,095,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5707/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,095,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5708/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,095,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5709/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,096,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5710/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,096,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5711/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,096,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5712/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=1,096,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5713/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,096,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5714/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,097,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5715/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,097,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5716/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=1,097,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5717/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,097,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5718/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,097,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5719/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,098,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5720/500000]
+ optim/total_grad_norm=1.559
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,098,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5721/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=1,098,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5722/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,098,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5723/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,098,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5724/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,099,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5725/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,099,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5726/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,099,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5727/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,099,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5728/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,099,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5729/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,099,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5730/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,100,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5731/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,100,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5732/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,100,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5733/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,100,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5734/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=1,100,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5735/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,101,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5736/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,101,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5737/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=1,101,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5738/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,101,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5739/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,101,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5740/500000]
+ optim/total_grad_norm=1.889
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,102,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5741/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,102,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5742/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=1,102,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5743/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,102,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5744/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,102,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5745/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=1,103,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5746/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,103,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5747/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,103,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5748/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,103,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5749/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,103,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5750/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,104,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5751/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,104,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5752/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,104,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5753/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=1,104,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5754/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,104,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5755/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,104,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5756/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,105,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5757/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,105,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5758/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,105,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5759/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,105,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5760/500000]
+ optim/total_grad_norm=1.489
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,105,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5761/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,106,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5762/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,106,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5763/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,106,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5764/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,106,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5765/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,106,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5766/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,107,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5767/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,107,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5768/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,107,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5769/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,107,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5770/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,107,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5771/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,108,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5772/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,108,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5773/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,108,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5774/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=1,108,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5775/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,108,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5776/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,108,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5777/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,109,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5778/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,109,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5779/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,109,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5780/500000]
+ optim/total_grad_norm=1.615
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,109,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5781/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,109,952,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5782/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,110,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5783/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,110,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5784/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=1,110,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5785/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,110,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5786/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,110,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5787/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,111,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5788/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,111,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5789/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,111,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5790/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,111,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5791/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,111,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5792/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,112,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5793/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,112,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5794/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,112,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5795/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,112,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5796/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,112,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5797/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,113,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5798/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,113,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5799/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,113,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5800/500000]
+ optim/total_grad_norm=1.816
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,113,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5801/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,113,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5802/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,113,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5803/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,114,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5804/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=1,114,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5805/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,114,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5806/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,114,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5807/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=1,114,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5808/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,115,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5809/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,115,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5810/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,115,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5811/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,115,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5812/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,115,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5813/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,116,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5814/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,116,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5815/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,116,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5816/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,116,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5817/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,116,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5818/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,117,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5819/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,117,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5820/500000]
+ optim/total_grad_norm=1.344
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,117,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5821/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,117,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5822/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=1,117,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5823/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,118,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5824/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,118,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5825/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,118,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5826/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,118,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5827/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,118,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5828/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,118,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5829/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,119,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5830/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,119,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5831/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,119,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5832/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=1,119,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5833/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,119,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5834/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,120,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5835/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,120,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5836/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,120,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5837/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,120,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5838/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,120,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5839/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,121,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5840/500000]
+ optim/total_grad_norm=1.395
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,121,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5841/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,121,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5842/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,121,664,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5843/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,121,856,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5844/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,122,048,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5845/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,122,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5846/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=1,122,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5847/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,122,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5848/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,122,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5849/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=1,123,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5850/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,123,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5851/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,123,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5852/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,123,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5853/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=1,123,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5854/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,123,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5855/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,124,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5856/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,124,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5857/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,124,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5858/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,124,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5859/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,124,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5860/500000]
+ optim/total_grad_norm=1.961
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=1,125,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5861/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,125,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5862/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,125,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5863/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=1,125,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5864/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,125,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5865/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,126,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5866/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,126,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5867/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,126,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5868/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,126,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5869/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,126,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5870/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,127,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5871/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,127,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5872/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,127,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5873/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,127,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5874/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,127,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5875/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,128,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5876/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,128,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5877/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,128,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5878/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,128,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5879/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,128,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5880/500000]
+ optim/total_grad_norm=1.224
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,128,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5881/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=1,129,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5882/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,129,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5883/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,129,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5884/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,129,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5885/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,129,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5886/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,130,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5887/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,130,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5888/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,130,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5889/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,130,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5890/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,130,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5891/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,131,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5892/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,131,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5893/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,131,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5894/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,131,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5895/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=1,131,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5896/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,132,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5897/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,132,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5898/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,132,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5899/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,132,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5900/500000]
+ optim/total_grad_norm=1.362
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,132,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5901/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,132,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5902/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,133,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5903/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,133,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5904/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=1,133,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5905/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,133,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5906/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,133,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5907/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,134,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5908/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=1,134,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5909/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,134,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5910/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,134,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5911/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,134,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5912/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,135,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5913/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,135,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5914/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,135,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5915/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,135,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5916/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,135,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5917/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,136,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5918/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,136,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5919/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,136,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5920/500000]
+ optim/total_grad_norm=1.466
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,136,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5921/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,136,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5922/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,137,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5923/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,137,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5924/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,137,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5925/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,137,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5926/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,137,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5927/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,137,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5928/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,138,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5929/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,138,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5930/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,138,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5931/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,138,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5932/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,138,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5933/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,139,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5934/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,139,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5935/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,139,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5936/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=1,139,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5937/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,139,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5938/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,140,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5939/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,140,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5940/500000]
+ optim/total_grad_norm=1.815
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=1,140,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5941/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,140,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5942/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,140,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5943/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,141,056,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5944/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,141,248,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5945/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,141,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5946/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=1,141,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5947/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=1,141,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5948/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,142,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5949/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,142,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5950/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,142,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5951/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,142,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5952/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,142,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5953/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,142,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5954/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,143,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5955/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,143,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5956/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,143,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5957/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,143,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5958/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,143,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5959/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,144,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5960/500000]
+ optim/total_grad_norm=1.399
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,144,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=5961/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,144,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5962/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,144,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5963/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,144,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5964/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,145,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5965/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,145,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5966/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,145,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5967/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,145,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5968/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,145,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5969/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,146,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5970/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,146,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5971/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,146,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5972/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,146,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5973/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,146,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5974/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=1,147,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5975/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,147,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5976/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=1,147,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5977/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,147,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5978/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,147,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5979/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=1,147,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5980/500000]
+ optim/total_grad_norm=1.753
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,148,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5981/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,148,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5982/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,148,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5983/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,148,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5984/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,148,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5985/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,149,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5986/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,149,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5987/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,149,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5988/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,149,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5989/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=1,149,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5990/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,150,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=5991/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,150,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5992/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,150,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5993/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,150,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5994/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,150,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5995/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,151,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5996/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,151,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5997/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,151,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5998/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,151,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=5999/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=1,151,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6000/500000]
+ optim/total_grad_norm=1.637
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,152,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [04:08:16] INFO | >> Saving config... checkpoint.py:608
+10/04 [04:09:00] INFO | >> Saving model state... checkpoint.py:796
+10/04 [04:10:14] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [04:11:47] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6001/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,152,192,000
+ throughput/device/tokens_per_second=1,198
+ throughput/device/batches_per_second=0.0499
+[step=6002/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,152,384,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=6003/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,152,576,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=6004/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,152,768,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=6005/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,152,960,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=6006/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=1,153,152,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=6007/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,153,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=6008/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,153,536,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=6009/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=1,153,728,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=6010/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,153,920,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=6011/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,154,112,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=6012/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,154,304,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=6013/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,154,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6014/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,154,688,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6015/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,154,880,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6016/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,155,072,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6017/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,155,264,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6018/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,155,456,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=6019/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,155,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6020/500000]
+ optim/total_grad_norm=1.657
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,155,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6021/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,156,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6022/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,156,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6023/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=1,156,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6024/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,156,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6025/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,156,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6026/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,156,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6027/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,157,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6028/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,157,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6029/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,157,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6030/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,157,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6031/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,157,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6032/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,158,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6033/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,158,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6034/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,158,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6035/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,158,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6036/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,158,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6037/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,159,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6038/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,159,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6039/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=1,159,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6040/500000]
+ optim/total_grad_norm=1.274
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,159,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6041/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,159,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6042/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,160,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6043/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,160,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6044/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,160,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6045/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,160,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6046/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=1,160,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6047/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,161,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6048/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,161,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6049/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,161,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6050/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,161,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6051/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,161,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6052/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,161,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6053/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,162,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6054/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,162,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6055/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,162,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6056/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,162,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6057/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,162,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6058/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,163,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6059/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,163,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6060/500000]
+ optim/total_grad_norm=0.9795
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,163,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6061/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,163,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6062/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,163,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6063/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,164,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6064/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,164,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6065/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,164,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6066/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,164,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6067/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,164,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6068/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,165,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6069/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,165,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6070/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=1,165,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6071/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,165,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6072/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=1,165,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6073/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,166,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6074/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,166,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6075/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,166,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6076/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,166,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6077/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,166,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6078/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,166,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6079/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,167,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6080/500000]
+ optim/total_grad_norm=2.157
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=1,167,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6081/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,167,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6082/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,167,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6083/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,167,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6084/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,168,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6085/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,168,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6086/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,168,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6087/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,168,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6088/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,168,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6089/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,169,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6090/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,169,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6091/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=1,169,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6092/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,169,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6093/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,169,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6094/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,170,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6095/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,170,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6096/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,170,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6097/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,170,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6098/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,170,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6099/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,171,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6100/500000]
+ optim/total_grad_norm=1.513
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,171,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6101/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,171,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6102/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,171,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6103/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,171,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6104/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,171,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6105/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,172,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6106/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,172,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6107/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,172,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6108/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,172,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6109/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=1,172,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6110/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,173,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6111/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,173,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6112/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=1,173,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6113/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,173,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6114/500000]
+ train/ActionNoiseL2Loss=0.1458
+ throughput/total_tokens=1,173,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6115/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,174,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6116/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,174,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6117/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,174,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6118/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=1,174,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6119/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,174,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6120/500000]
+ optim/total_grad_norm=1.914
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,175,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6121/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=1,175,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6122/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,175,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6123/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,175,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6124/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,175,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6125/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,176,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6126/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,176,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6127/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=1,176,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6128/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,176,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6129/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,176,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6130/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,176,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6131/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,177,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6132/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,177,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6133/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=1,177,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6134/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=1,177,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6135/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,177,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6136/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,178,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6137/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,178,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6138/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,178,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6139/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,178,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6140/500000]
+ optim/total_grad_norm=1.701
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,178,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6141/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,179,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6142/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,179,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6143/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,179,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6144/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,179,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6145/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=1,179,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6146/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,180,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6147/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,180,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6148/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,180,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6149/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,180,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6150/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,180,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6151/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,180,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6152/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,181,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6153/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,181,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6154/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,181,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6155/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,181,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6156/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,181,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6157/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,182,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6158/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,182,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6159/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,182,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6160/500000]
+ optim/total_grad_norm=2.193
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=1,182,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6161/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,182,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6162/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,183,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6163/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,183,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6164/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=1,183,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6165/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,183,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6166/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,183,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6167/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=1,184,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6168/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=1,184,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6169/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,184,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6170/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,184,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6171/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,184,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6172/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,185,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6173/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,185,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6174/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,185,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6175/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,185,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6176/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=1,185,792,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6177/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,185,984,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6178/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,186,176,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6179/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=1,186,368,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6180/500000]
+ optim/total_grad_norm=1.494
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=1,186,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6181/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=1,186,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6182/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,186,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6183/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,187,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6184/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,187,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6185/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,187,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6186/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=1,187,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6187/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,187,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6188/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,188,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6189/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=1,188,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6190/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=1,188,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6191/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,188,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6192/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,188,864,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6193/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,189,056,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6194/500000]
+ train/ActionNoiseL2Loss=0.1822
+ throughput/total_tokens=1,189,248,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6195/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,189,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6196/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,189,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6197/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,189,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6198/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=1,190,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6199/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,190,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6200/500000]
+ optim/total_grad_norm=1.442
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,190,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6201/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,190,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6202/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,190,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6203/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,190,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6204/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,191,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6205/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=1,191,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6206/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,191,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6207/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,191,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6208/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,191,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6209/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,192,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6210/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,192,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6211/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,192,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6212/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=1,192,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6213/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,192,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6214/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,193,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6215/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=1,193,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6216/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,193,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6217/500000]
+ train/ActionNoiseL2Loss=0.1851
+ throughput/total_tokens=1,193,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6218/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,193,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6219/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=1,194,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6220/500000]
+ optim/total_grad_norm=1.267
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,194,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6221/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,194,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6222/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,194,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6223/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,194,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6224/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,195,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6225/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,195,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6226/500000]
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=1,195,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6227/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,195,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6228/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=1,195,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6229/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=1,195,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6230/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,196,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6231/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,196,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6232/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,196,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6233/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,196,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6234/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,196,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6235/500000]
+ train/ActionNoiseL2Loss=0.1592
+ throughput/total_tokens=1,197,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6236/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,197,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6237/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,197,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6238/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,197,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6239/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,197,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6240/500000]
+ optim/total_grad_norm=1.664
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,198,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6241/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,198,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6242/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,198,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6243/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,198,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6244/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,198,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6245/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,199,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6246/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,199,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6247/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,199,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6248/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,199,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6249/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,199,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6250/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,200,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6251/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,200,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6252/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,200,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6253/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,200,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6254/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,200,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6255/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=1,200,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6256/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=1,201,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6257/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,201,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6258/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,201,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6259/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,201,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6260/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,201,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6261/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,202,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6262/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,202,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6263/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,202,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6264/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,202,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6265/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,202,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6266/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,203,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6267/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=1,203,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6268/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,203,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6269/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,203,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6270/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,203,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6271/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,204,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6272/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,204,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6273/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,204,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6274/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,204,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6275/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,204,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6276/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,204,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6277/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,205,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6278/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,205,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6279/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,205,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6280/500000]
+ optim/total_grad_norm=1.279
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,205,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6281/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,205,952,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6282/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,206,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6283/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=1,206,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6284/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,206,528,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6285/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,206,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6286/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,206,912,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6287/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=1,207,104,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6288/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,207,296,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6289/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,207,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6290/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,207,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6291/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,207,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6292/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,208,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6293/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,208,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6294/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,208,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6295/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,208,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6296/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,208,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6297/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=1,209,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6298/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,209,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6299/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,209,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6300/500000]
+ optim/total_grad_norm=1.681
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,209,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6301/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,209,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6302/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,209,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6303/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=1,210,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6304/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,210,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6305/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,210,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6306/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,210,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6307/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,210,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6308/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=1,211,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6309/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,211,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6310/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=1,211,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6311/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,211,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6312/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,211,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6313/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,212,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6314/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,212,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6315/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,212,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6316/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,212,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6317/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,212,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6318/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=1,213,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6319/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,213,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6320/500000]
+ optim/total_grad_norm=1.664
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,213,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6321/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,213,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6322/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,213,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6323/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=1,214,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6324/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=1,214,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6325/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,214,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6326/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,214,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6327/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,214,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6328/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,214,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6329/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,215,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6330/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,215,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6331/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=1,215,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6332/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,215,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6333/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,215,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6334/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,216,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6335/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,216,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6336/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,216,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6337/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,216,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6338/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,216,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6339/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,217,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6340/500000]
+ optim/total_grad_norm=1.321
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,217,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6341/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,217,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6342/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,217,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6343/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,217,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6344/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,218,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6345/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,218,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6346/500000]
+ train/ActionNoiseL2Loss=0.1789
+ throughput/total_tokens=1,218,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6347/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,218,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6348/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,218,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6349/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,219,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6350/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,219,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6351/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,219,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6352/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,219,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6353/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,219,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6354/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,219,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6355/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,220,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6356/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,220,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6357/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,220,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6358/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,220,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6359/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=1,220,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6360/500000]
+ optim/total_grad_norm=1.809
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,221,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6361/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,221,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6362/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,221,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6363/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,221,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6364/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,221,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6365/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,222,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6366/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,222,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6367/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,222,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6368/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,222,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6369/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,222,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6370/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,223,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6371/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,223,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6372/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,223,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6373/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=1,223,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6374/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,223,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6375/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,224,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6376/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,224,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6377/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,224,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6378/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,224,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6379/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,224,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6380/500000]
+ optim/total_grad_norm=1.292
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,224,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6381/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,225,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6382/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,225,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6383/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,225,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6384/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,225,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6385/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,225,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6386/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,226,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6387/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,226,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6388/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,226,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6389/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,226,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6390/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,226,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6391/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,227,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6392/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,227,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6393/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,227,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6394/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,227,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6395/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,227,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6396/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=1,228,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6397/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,228,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6398/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,228,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6399/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,228,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6400/500000]
+ optim/total_grad_norm=1.326
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,228,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6401/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,228,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6402/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,229,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6403/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,229,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6404/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,229,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6405/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,229,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6406/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,229,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6407/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,230,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6408/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,230,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6409/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,230,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6410/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,230,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6411/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,230,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6412/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,231,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6413/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,231,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6414/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,231,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6415/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=1,231,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6416/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,231,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6417/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,232,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6418/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,232,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6419/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,232,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6420/500000]
+ optim/total_grad_norm=1.479
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=1,232,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6421/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,232,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6422/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,233,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6423/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,233,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6424/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,233,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6425/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,233,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6426/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,233,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6427/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,233,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6428/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,234,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6429/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,234,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6430/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,234,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6431/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,234,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6432/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,234,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6433/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=1,235,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6434/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,235,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6435/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,235,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6436/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,235,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6437/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,235,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6438/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,236,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6439/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,236,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6440/500000]
+ optim/total_grad_norm=1.219
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,236,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6441/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,236,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6442/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,236,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6443/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,237,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6444/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,237,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6445/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,237,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6446/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,237,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6447/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,237,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6448/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,238,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6449/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,238,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6450/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,238,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6451/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,238,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6452/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,238,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6453/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,238,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6454/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,239,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6455/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,239,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6456/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,239,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6457/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,239,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6458/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,239,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6459/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,240,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6460/500000]
+ optim/total_grad_norm=2.238
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=1,240,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6461/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,240,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6462/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,240,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6463/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,240,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6464/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,241,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6465/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,241,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6466/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,241,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6467/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=1,241,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6468/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,241,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6469/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,242,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6470/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,242,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6471/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,242,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6472/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,242,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6473/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=1,242,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6474/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=1,243,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6475/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,243,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6476/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,243,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6477/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,243,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6478/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,243,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6479/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,243,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6480/500000]
+ optim/total_grad_norm=1.355
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,244,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6481/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,244,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6482/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,244,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6483/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,244,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6484/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,244,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6485/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,245,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6486/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,245,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6487/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,245,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6488/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,245,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6489/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,245,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6490/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,246,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6491/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,246,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6492/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,246,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6493/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,246,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6494/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,246,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6495/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,247,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6496/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,247,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6497/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=1,247,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6498/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,247,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6499/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,247,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6500/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,248,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/04 [07:05:27] INFO | >> Saving config... checkpoint.py:608
+10/04 [07:06:04] INFO | >> Saving model state... checkpoint.py:796
+10/04 [07:07:18] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [07:08:45] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6501/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,248,192,000
+ throughput/device/tokens_per_second=1,193
+ throughput/device/batches_per_second=0.0497
+[step=6502/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,248,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=6503/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,248,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6504/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,248,768,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=6505/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=1,248,960,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=6506/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,249,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6507/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,249,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6508/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,249,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6509/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,249,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6510/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,249,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6511/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,250,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6512/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,250,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6513/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,250,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=6514/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,250,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6515/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,250,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6516/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,251,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6517/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,251,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6518/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,251,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6519/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,251,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6520/500000]
+ optim/total_grad_norm=1.895
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=1,251,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6521/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,252,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6522/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,252,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6523/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,252,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6524/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,252,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6525/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,252,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6526/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,252,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6527/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,253,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6528/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,253,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6529/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,253,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6530/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,253,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6531/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,253,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6532/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,254,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6533/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=1,254,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6534/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,254,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6535/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,254,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6536/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=1,254,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6537/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,255,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6538/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=1,255,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6539/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,255,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6540/500000]
+ optim/total_grad_norm=1.079
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,255,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6541/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,255,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6542/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,256,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6543/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,256,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6544/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,256,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6545/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,256,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6546/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,256,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6547/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=1,257,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6548/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,257,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6549/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,257,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6550/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=1,257,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6551/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,257,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6552/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,257,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6553/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,258,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6554/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,258,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6555/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,258,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6556/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,258,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6557/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,258,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6558/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,259,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6559/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=1,259,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6560/500000]
+ optim/total_grad_norm=1.530
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,259,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6561/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,259,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6562/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,259,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6563/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,260,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6564/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=1,260,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6565/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,260,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6566/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,260,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6567/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,260,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6568/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,261,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6569/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,261,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6570/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,261,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6571/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,261,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6572/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,261,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6573/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,262,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6574/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,262,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6575/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,262,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6576/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,262,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6577/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,262,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6578/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,262,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6579/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,263,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6580/500000]
+ optim/total_grad_norm=1.263
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,263,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6581/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,263,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6582/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,263,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6583/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,263,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6584/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,264,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6585/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,264,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6586/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,264,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6587/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,264,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6588/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,264,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6589/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,265,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6590/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,265,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6591/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,265,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6592/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,265,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6593/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,265,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6594/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,266,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6595/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=1,266,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6596/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,266,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6597/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,266,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6598/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,266,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6599/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=1,267,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6600/500000]
+ optim/total_grad_norm=2.164
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=1,267,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6601/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,267,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6602/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,267,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6603/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,267,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6604/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=1,267,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6605/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,268,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6606/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=1,268,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6607/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,268,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6608/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=1,268,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6609/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,268,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6610/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,269,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6611/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,269,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6612/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,269,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6613/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,269,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6614/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,269,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6615/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,270,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6616/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,270,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6617/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,270,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6618/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,270,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6619/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,270,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6620/500000]
+ optim/total_grad_norm=1.698
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,271,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6621/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,271,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6622/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,271,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6623/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,271,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6624/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,271,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6625/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,272,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6626/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=1,272,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6627/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,272,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6628/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,272,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6629/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,272,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6630/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,272,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6631/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,273,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6632/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,273,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6633/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,273,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6634/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,273,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6635/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,273,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6636/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,274,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6637/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,274,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6638/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,274,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6639/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,274,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6640/500000]
+ optim/total_grad_norm=1.193
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,274,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6641/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,275,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6642/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,275,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6643/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,275,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6644/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,275,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6645/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,275,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6646/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,276,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6647/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,276,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6648/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,276,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6649/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,276,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6650/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,276,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6651/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=1,276,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6652/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,277,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6653/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,277,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6654/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,277,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6655/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,277,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6656/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,277,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6657/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,278,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6658/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,278,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6659/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,278,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6660/500000]
+ optim/total_grad_norm=1.511
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,278,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6661/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,278,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6662/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,279,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6663/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,279,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6664/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,279,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6665/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,279,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6666/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,279,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6667/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,280,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6668/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,280,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6669/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,280,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6670/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,280,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6671/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,280,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6672/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=1,281,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6673/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,281,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6674/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,281,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6675/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,281,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6676/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,281,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6677/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,281,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6678/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,282,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6679/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,282,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6680/500000]
+ optim/total_grad_norm=1.589
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,282,560,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6681/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,282,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6682/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,282,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6683/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,283,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6684/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,283,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6685/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,283,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6686/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,283,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6687/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,283,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6688/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=1,284,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6689/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,284,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6690/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,284,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6691/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,284,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6692/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,284,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6693/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,285,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6694/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,285,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6695/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,285,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6696/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,285,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6697/500000]
+ train/ActionNoiseL2Loss=0.1685
+ throughput/total_tokens=1,285,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6698/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,286,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6699/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=1,286,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6700/500000]
+ optim/total_grad_norm=1.473
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,286,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6701/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,286,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6702/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=1,286,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6703/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,286,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6704/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,287,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6705/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=1,287,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6706/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,287,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6707/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,287,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6708/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,287,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6709/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,288,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6710/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,288,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6711/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,288,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6712/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,288,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6713/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=1,288,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6714/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,289,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6715/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,289,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6716/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,289,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6717/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,289,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6718/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,289,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6719/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,290,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6720/500000]
+ optim/total_grad_norm=1.246
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,290,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6721/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,290,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6722/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=1,290,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6723/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,290,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6724/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,291,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6725/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,291,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6726/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,291,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6727/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,291,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6728/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,291,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6729/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,291,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6730/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,292,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6731/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=1,292,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6732/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,292,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6733/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,292,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6734/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,292,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6735/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,293,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6736/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,293,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6737/500000]
+ train/ActionNoiseL2Loss=0.1536
+ throughput/total_tokens=1,293,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6738/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,293,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6739/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,293,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6740/500000]
+ optim/total_grad_norm=1.373
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,294,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6741/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,294,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6742/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,294,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6743/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,294,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6744/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,294,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6745/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=1,295,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6746/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,295,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6747/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,295,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6748/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,295,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6749/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=1,295,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6750/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,296,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6751/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=1,296,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6752/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,296,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6753/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,296,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6754/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,296,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6755/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,296,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6756/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,297,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6757/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,297,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6758/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,297,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6759/500000]
+ train/ActionNoiseL2Loss=0.1363
+ throughput/total_tokens=1,297,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6760/500000]
+ optim/total_grad_norm=1.455
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,297,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6761/500000]
+ train/ActionNoiseL2Loss=0.2074
+ throughput/total_tokens=1,298,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6762/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,298,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6763/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,298,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6764/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,298,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6765/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=1,298,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6766/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,299,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6767/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,299,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6768/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,299,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6769/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,299,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6770/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,299,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6771/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,300,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6772/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,300,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6773/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,300,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6774/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,300,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6775/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,300,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6776/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,300,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6777/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=1,301,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6778/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,301,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6779/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=1,301,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6780/500000]
+ optim/total_grad_norm=1.339
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,301,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6781/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,301,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6782/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,302,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6783/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,302,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6784/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,302,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6785/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=1,302,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6786/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,302,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6787/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,303,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6788/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,303,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6789/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,303,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6790/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=1,303,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6791/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=1,303,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6792/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,304,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6793/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,304,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6794/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,304,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6795/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,304,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6796/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,304,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6797/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=1,305,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6798/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,305,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6799/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,305,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6800/500000]
+ optim/total_grad_norm=1.613
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,305,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6801/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,305,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6802/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,305,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6803/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,306,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6804/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=1,306,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6805/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,306,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6806/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,306,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6807/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,306,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6808/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,307,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6809/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=1,307,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6810/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,307,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6811/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,307,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6812/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,307,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6813/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,308,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6814/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,308,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6815/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,308,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6816/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,308,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6817/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,308,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6818/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,309,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6819/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,309,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6820/500000]
+ optim/total_grad_norm=1.262
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,309,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6821/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=1,309,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6822/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,309,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6823/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,310,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6824/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,310,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6825/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=1,310,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6826/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,310,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6827/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,310,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6828/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,310,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6829/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,311,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6830/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,311,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6831/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=1,311,552,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6832/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,311,744,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6833/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,311,936,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6834/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,312,128,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6835/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,312,320,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6836/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,312,512,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6837/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=1,312,704,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6838/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,312,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6839/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,313,088,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6840/500000]
+ optim/total_grad_norm=1.264
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,313,280,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6841/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,313,472,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6842/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,313,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6843/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,313,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6844/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,314,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6845/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,314,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6846/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,314,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6847/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=1,314,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6848/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,314,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6849/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,315,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6850/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,315,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6851/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,315,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6852/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,315,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6853/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,315,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6854/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,315,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6855/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=1,316,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6856/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,316,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6857/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,316,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6858/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,316,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6859/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=1,316,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6860/500000]
+ optim/total_grad_norm=1.285
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,317,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6861/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,317,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6862/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,317,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6863/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,317,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6864/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,317,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6865/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,318,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6866/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=1,318,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6867/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,318,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6868/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,318,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6869/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,318,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6870/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,319,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6871/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,319,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6872/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,319,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6873/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,319,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6874/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,319,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6875/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=1,320,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6876/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=1,320,192,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6877/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,320,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6878/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,320,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6879/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,320,768,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6880/500000]
+ optim/total_grad_norm=1.559
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,320,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6881/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,321,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6882/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,321,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6883/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,321,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6884/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,321,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6885/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,321,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6886/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=1,322,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6887/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,322,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6888/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,322,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6889/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,322,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6890/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,322,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6891/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,323,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6892/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,323,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6893/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,323,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6894/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,323,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6895/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,323,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6896/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,324,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6897/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,324,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6898/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,324,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6899/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,324,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6900/500000]
+ optim/total_grad_norm=1.223
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,324,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6901/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,324,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6902/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,325,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6903/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,325,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6904/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,325,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6905/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,325,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6906/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,325,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6907/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,326,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6908/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,326,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6909/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,326,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6910/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,326,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6911/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,326,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6912/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,327,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6913/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,327,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6914/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,327,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6915/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,327,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6916/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=1,327,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6917/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,328,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6918/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,328,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6919/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,328,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6920/500000]
+ optim/total_grad_norm=1.428
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,328,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6921/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,328,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6922/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,329,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6923/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,329,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6924/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,329,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6925/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,329,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6926/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,329,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6927/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,329,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6928/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,330,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6929/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,330,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6930/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,330,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6931/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,330,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6932/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,330,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6933/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,331,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6934/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,331,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6935/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,331,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6936/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,331,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6937/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,331,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6938/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,332,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6939/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,332,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6940/500000]
+ optim/total_grad_norm=1.088
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,332,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6941/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,332,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6942/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,332,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6943/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,333,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6944/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,333,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6945/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,333,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6946/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,333,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6947/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,333,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6948/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,334,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6949/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,334,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6950/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,334,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6951/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,334,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6952/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,334,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6953/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,334,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6954/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,335,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6955/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,335,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6956/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,335,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6957/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,335,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6958/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,335,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6959/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,336,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6960/500000]
+ optim/total_grad_norm=1.065
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,336,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=6961/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,336,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6962/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,336,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6963/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,336,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6964/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=1,337,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6965/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,337,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6966/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,337,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6967/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,337,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6968/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,337,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6969/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,338,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6970/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=1,338,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6971/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,338,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6972/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,338,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6973/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,338,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6974/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,339,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6975/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,339,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6976/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,339,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6977/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,339,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6978/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,339,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6979/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,339,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6980/500000]
+ optim/total_grad_norm=0.8997
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,340,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6981/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,340,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6982/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,340,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6983/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,340,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6984/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,340,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6985/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,341,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6986/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,341,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6987/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,341,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6988/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,341,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6989/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,341,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6990/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,342,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=6991/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,342,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6992/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,342,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6993/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,342,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6994/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,342,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6995/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,343,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6996/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,343,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6997/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,343,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6998/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,343,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6999/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=1,343,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7000/500000]
+ optim/total_grad_norm=1.555
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,344,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [10:02:16] INFO | >> Saving config... checkpoint.py:608
+10/04 [10:03:12] INFO | >> Saving model state... checkpoint.py:796
+10/04 [10:04:26] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [10:05:59] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7001/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=1,344,192,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=7002/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,344,384,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=7003/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,344,576,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=7004/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,344,768,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=7005/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,344,960,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=7006/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,345,152,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=7007/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,345,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=7008/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,345,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=7009/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,345,728,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=7010/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=1,345,920,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=7011/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=1,346,112,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=7012/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,346,304,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7013/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,346,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7014/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,346,688,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=7015/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=1,346,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7016/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,347,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7017/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=1,347,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7018/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,347,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7019/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,347,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7020/500000]
+ optim/total_grad_norm=1.240
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,347,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7021/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,348,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7022/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=1,348,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7023/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=1,348,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7024/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,348,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7025/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,348,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7026/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,348,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7027/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,349,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7028/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,349,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7029/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,349,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7030/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,349,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7031/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,349,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7032/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,350,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7033/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,350,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7034/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,350,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7035/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=1,350,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7036/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,350,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7037/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,351,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7038/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,351,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7039/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,351,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7040/500000]
+ optim/total_grad_norm=1.978
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,351,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7041/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=1,351,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7042/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,352,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7043/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,352,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7044/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,352,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7045/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,352,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7046/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,352,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7047/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,353,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7048/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,353,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7049/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,353,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7050/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,353,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7051/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,353,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7052/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=1,353,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7053/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,354,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7054/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,354,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7055/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,354,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7056/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=1,354,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7057/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,354,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7058/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,355,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7059/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,355,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7060/500000]
+ optim/total_grad_norm=1.831
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,355,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7061/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=1,355,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7062/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,355,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7063/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,356,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7064/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,356,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7065/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,356,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7066/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,356,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7067/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,356,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7068/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,357,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7069/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=1,357,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7070/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,357,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7071/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,357,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7072/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,357,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7073/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,358,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7074/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,358,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7075/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,358,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7076/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,358,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7077/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,358,784,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7078/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,358,976,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7079/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,359,168,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7080/500000]
+ optim/total_grad_norm=1.668
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,359,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7081/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=1,359,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7082/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,359,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7083/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,359,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7084/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,360,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7085/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,360,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7086/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,360,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7087/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,360,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7088/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,360,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7089/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,361,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7090/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=1,361,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7091/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,361,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7092/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,361,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7093/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,361,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7094/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,362,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7095/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,362,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7096/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,362,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7097/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,362,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7098/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,362,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7099/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,363,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7100/500000]
+ optim/total_grad_norm=1.376
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,363,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7101/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,363,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7102/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=1,363,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7103/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,363,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7104/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,363,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7105/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,364,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7106/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,364,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7107/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,364,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7108/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,364,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7109/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=1,364,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7110/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,365,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7111/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,365,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7112/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,365,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7113/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,365,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7114/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=1,365,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7115/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,366,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7116/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,366,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7117/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,366,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7118/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,366,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7119/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,366,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7120/500000]
+ optim/total_grad_norm=1.469
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=1,367,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7121/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,367,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7122/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,367,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7123/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=1,367,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7124/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,367,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7125/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,368,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7126/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,368,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7127/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,368,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7128/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,368,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7129/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,368,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7130/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,368,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7131/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,369,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7132/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,369,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7133/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,369,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7134/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,369,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7135/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,369,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7136/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,370,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7137/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,370,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7138/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,370,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7139/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,370,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7140/500000]
+ optim/total_grad_norm=1.813
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=1,370,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7141/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,371,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7142/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,371,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7143/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,371,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7144/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=1,371,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7145/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,371,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7146/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,372,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7147/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,372,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7148/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,372,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7149/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,372,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7150/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,372,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7151/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,372,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7152/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,373,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7153/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=1,373,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7154/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,373,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7155/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,373,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7156/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,373,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7157/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,374,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7158/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,374,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7159/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,374,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7160/500000]
+ optim/total_grad_norm=1.167
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,374,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7161/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=1,374,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7162/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,375,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7163/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,375,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7164/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,375,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7165/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,375,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7166/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,375,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7167/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,376,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7168/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,376,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7169/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,376,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7170/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,376,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7171/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,376,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7172/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=1,377,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7173/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,377,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7174/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,377,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7175/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=1,377,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7176/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,377,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7177/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,377,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7178/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,378,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7179/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,378,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7180/500000]
+ optim/total_grad_norm=0.9939
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,378,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7181/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,378,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7182/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,378,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7183/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,379,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7184/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,379,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7185/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,379,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7186/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=1,379,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7187/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,379,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7188/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,380,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7189/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,380,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7190/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,380,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7191/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,380,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7192/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,380,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7193/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,381,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7194/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,381,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7195/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,381,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7196/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,381,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7197/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,381,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7198/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,382,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7199/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,382,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7200/500000]
+ optim/total_grad_norm=1.828
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=1,382,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7201/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=1,382,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7202/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=1,382,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7203/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,382,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7204/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,383,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7205/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,383,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7206/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,383,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7207/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,383,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7208/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,383,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7209/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,384,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7210/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,384,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7211/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,384,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7212/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,384,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7213/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,384,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7214/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,385,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7215/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,385,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7216/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,385,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7217/500000]
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=1,385,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7218/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,385,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7219/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,386,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7220/500000]
+ optim/total_grad_norm=1.854
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,386,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7221/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,386,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7222/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,386,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7223/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,386,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7224/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,387,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7225/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=1,387,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7226/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=1,387,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7227/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,387,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7228/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,387,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7229/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,387,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7230/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,388,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7231/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,388,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7232/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,388,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7233/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,388,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7234/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,388,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7235/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,389,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7236/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,389,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7237/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,389,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7238/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=1,389,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7239/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=1,389,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7240/500000]
+ optim/total_grad_norm=1.211
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,390,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7241/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,390,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7242/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,390,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7243/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,390,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7244/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,390,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7245/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,391,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7246/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,391,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7247/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,391,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7248/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,391,616,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7249/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,391,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7250/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,392,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7251/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,392,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7252/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,392,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7253/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,392,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7254/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,392,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7255/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,392,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7256/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,393,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7257/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,393,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7258/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,393,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7259/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,393,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7260/500000]
+ optim/total_grad_norm=1.483
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=1,393,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7261/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,394,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7262/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,394,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7263/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,394,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7264/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,394,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7265/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,394,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7266/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,395,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7267/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,395,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7268/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,395,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7269/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,395,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7270/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,395,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7271/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,396,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7272/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,396,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7273/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,396,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7274/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,396,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7275/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,396,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7276/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=1,396,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7277/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,397,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7278/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,397,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7279/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,397,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7280/500000]
+ optim/total_grad_norm=1.172
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,397,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7281/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=1,397,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7282/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,398,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7283/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,398,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7284/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,398,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7285/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,398,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7286/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,398,912,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7287/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,399,104,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7288/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=1,399,296,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7289/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,399,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7290/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,399,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7291/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,399,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7292/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=1,400,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7293/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,400,256,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7294/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,400,448,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7295/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,400,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7296/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,400,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7297/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,401,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7298/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,401,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7299/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,401,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7300/500000]
+ optim/total_grad_norm=0.9868
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,401,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7301/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,401,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7302/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,401,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7303/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,402,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7304/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=1,402,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7305/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,402,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7306/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,402,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7307/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,402,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7308/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,403,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7309/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,403,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7310/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,403,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7311/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,403,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7312/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,403,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7313/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=1,404,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7314/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,404,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7315/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,404,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7316/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,404,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7317/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,404,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7318/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,405,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7319/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,405,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7320/500000]
+ optim/total_grad_norm=1.711
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,405,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7321/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,405,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7322/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=1,405,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7323/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,406,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7324/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,406,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7325/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,406,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7326/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,406,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7327/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,406,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7328/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,406,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7329/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,407,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7330/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=1,407,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7331/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,407,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7332/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,407,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7333/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,407,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7334/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,408,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7335/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,408,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7336/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,408,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7337/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,408,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7338/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,408,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7339/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,409,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7340/500000]
+ optim/total_grad_norm=1.226
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,409,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7341/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,409,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7342/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,409,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7343/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,409,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7344/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,410,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7345/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,410,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7346/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,410,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7347/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,410,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7348/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,410,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7349/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,411,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7350/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,411,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7351/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,411,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7352/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,411,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7353/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,411,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7354/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,411,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7355/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,412,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7356/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,412,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7357/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,412,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7358/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,412,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7359/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,412,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7360/500000]
+ optim/total_grad_norm=1.268
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,413,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7361/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,413,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7362/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,413,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7363/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,413,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7364/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,413,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7365/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,414,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7366/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,414,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7367/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,414,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7368/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,414,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7369/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=1,414,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7370/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,415,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7371/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,415,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7372/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,415,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7373/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,415,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7374/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=1,415,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7375/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,416,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7376/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,416,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7377/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,416,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7378/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,416,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7379/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,416,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7380/500000]
+ optim/total_grad_norm=1.347
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,416,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7381/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,417,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7382/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,417,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7383/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,417,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7384/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,417,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7385/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,417,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7386/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,418,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7387/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,418,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7388/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=1,418,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7389/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,418,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7390/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,418,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7391/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,419,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7392/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,419,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7393/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,419,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7394/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,419,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7395/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,419,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7396/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=1,420,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7397/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,420,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7398/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,420,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7399/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,420,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7400/500000]
+ optim/total_grad_norm=0.9301
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,420,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7401/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,420,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7402/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,421,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7403/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,421,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7404/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,421,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7405/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,421,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7406/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,421,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7407/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,422,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7408/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,422,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7409/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,422,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7410/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,422,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7411/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,422,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7412/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,423,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7413/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,423,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7414/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,423,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7415/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,423,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7416/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,423,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7417/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=1,424,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7418/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=1,424,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7419/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,424,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7420/500000]
+ optim/total_grad_norm=1.051
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,424,640,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7421/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,424,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7422/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,425,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7423/500000]
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=1,425,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7424/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,425,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7425/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,425,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7426/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,425,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7427/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,425,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7428/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,426,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7429/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,426,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7430/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,426,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7431/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,426,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7432/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,426,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7433/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,427,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7434/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=1,427,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7435/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,427,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7436/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,427,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7437/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,427,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7438/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,428,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7439/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,428,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7440/500000]
+ optim/total_grad_norm=0.7841
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,428,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7441/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,428,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7442/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,428,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7443/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,429,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7444/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=1,429,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7445/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,429,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7446/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,429,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7447/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,429,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7448/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=1,430,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7449/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,430,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7450/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,430,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7451/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,430,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7452/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,430,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7453/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=1,430,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7454/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,431,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7455/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,431,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7456/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,431,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7457/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,431,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7458/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,431,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7459/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,432,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7460/500000]
+ optim/total_grad_norm=1.520
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,432,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7461/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=1,432,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7462/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,432,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7463/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,432,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7464/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,433,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7465/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,433,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7466/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,433,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7467/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,433,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7468/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,433,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7469/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,434,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7470/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,434,240,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7471/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,434,432,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7472/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,434,624,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7473/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,434,816,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7474/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,435,008,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7475/500000]
+ train/ActionNoiseL2Loss=0.1549
+ throughput/total_tokens=1,435,200,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7476/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,435,392,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7477/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,435,584,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7478/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,435,776,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7479/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,435,968,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7480/500000]
+ optim/total_grad_norm=1.679
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,436,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7481/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,436,352,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7482/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,436,544,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7483/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,436,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7484/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,436,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7485/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=1,437,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7486/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,437,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7487/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,437,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7488/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,437,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7489/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,437,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7490/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,438,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7491/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,438,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7492/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,438,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7493/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,438,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7494/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,438,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7495/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,439,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7496/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,439,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7497/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,439,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7498/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,439,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7499/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,439,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7500/500000]
+ optim/total_grad_norm=1.111
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,440,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [12:59:28] INFO | >> Saving config... checkpoint.py:608
+10/04 [13:00:24] INFO | >> Saving model state... checkpoint.py:796
+10/04 [13:01:38] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [13:03:10] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7501/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,440,192,000
+ throughput/device/tokens_per_second=1,197
+ throughput/device/batches_per_second=0.0499
+[step=7502/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,440,384,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=7503/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,440,576,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=7504/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,440,768,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=7505/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,440,960,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=7506/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,441,152,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=7507/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,441,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=7508/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,441,536,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=7509/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,441,728,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=7510/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,441,920,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=7511/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,442,112,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7512/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,442,304,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7513/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,442,496,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7514/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,442,688,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7515/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=1,442,880,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=7516/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=1,443,072,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=7517/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,443,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7518/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,443,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7519/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,443,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7520/500000]
+ optim/total_grad_norm=1.505
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,443,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7521/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,444,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7522/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,444,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7523/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,444,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7524/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,444,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7525/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,444,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7526/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,444,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7527/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,445,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7528/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=1,445,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7529/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,445,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7530/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,445,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7531/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,445,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7532/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,446,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7533/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,446,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7534/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,446,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7535/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,446,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7536/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,446,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7537/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,447,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7538/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=1,447,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7539/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,447,488,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7540/500000]
+ optim/total_grad_norm=1.271
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,447,680,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7541/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,447,872,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7542/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,448,064,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7543/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,448,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7544/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,448,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7545/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,448,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7546/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,448,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7547/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,449,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7548/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,449,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7549/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,449,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7550/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,449,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7551/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,449,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7552/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,449,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7553/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,450,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7554/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,450,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7555/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,450,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7556/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,450,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7557/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,450,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7558/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,451,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7559/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,451,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7560/500000]
+ optim/total_grad_norm=1.053
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,451,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7561/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,451,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7562/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,451,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7563/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,452,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7564/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,452,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7565/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=1,452,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7566/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,452,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7567/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,452,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7568/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,453,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7569/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,453,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7570/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,453,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7571/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,453,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7572/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,453,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7573/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,454,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7574/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,454,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7575/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,454,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7576/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,454,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7577/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,454,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7578/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=1,454,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7579/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,455,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7580/500000]
+ optim/total_grad_norm=1.769
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,455,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7581/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,455,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7582/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,455,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7583/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,455,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7584/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,456,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7585/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,456,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7586/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,456,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7587/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,456,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7588/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,456,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7589/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,457,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7590/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,457,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7591/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,457,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7592/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,457,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7593/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,457,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7594/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,458,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7595/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,458,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7596/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,458,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7597/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,458,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7598/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,458,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7599/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,459,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7600/500000]
+ optim/total_grad_norm=2.346
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=1,459,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7601/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,459,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7602/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,459,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7603/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,459,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7604/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,459,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7605/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,460,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7606/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,460,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7607/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=1,460,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7608/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,460,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7609/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,460,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7610/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,461,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7611/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,461,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7612/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,461,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7613/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,461,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7614/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,461,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7615/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,462,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7616/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,462,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7617/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,462,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7618/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,462,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7619/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=1,462,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7620/500000]
+ optim/total_grad_norm=1.406
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,463,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7621/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,463,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7622/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,463,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7623/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,463,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7624/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,463,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7625/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,464,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7626/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,464,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7627/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,464,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7628/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,464,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7629/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,464,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7630/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,464,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7631/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,465,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7632/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,465,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7633/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,465,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7634/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,465,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7635/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,465,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7636/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,466,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7637/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=1,466,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7638/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,466,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7639/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=1,466,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7640/500000]
+ optim/total_grad_norm=1.933
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=1,466,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7641/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,467,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7642/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,467,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7643/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,467,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7644/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,467,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7645/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,467,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7646/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,468,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7647/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,468,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7648/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,468,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7649/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=1,468,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7650/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,468,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7651/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,468,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7652/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=1,469,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7653/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,469,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7654/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,469,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7655/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,469,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7656/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=1,469,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7657/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,470,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7658/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,470,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7659/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,470,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7660/500000]
+ optim/total_grad_norm=1.497
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,470,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7661/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,470,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7662/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,471,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7663/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,471,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7664/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,471,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7665/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,471,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7666/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,471,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7667/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,472,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7668/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=1,472,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7669/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,472,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7670/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,472,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7671/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,472,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7672/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,473,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7673/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,473,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7674/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,473,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7675/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,473,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7676/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,473,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7677/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,473,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7678/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=1,474,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7679/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,474,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7680/500000]
+ optim/total_grad_norm=0.8452
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,474,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7681/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,474,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7682/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,474,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7683/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,475,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7684/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=1,475,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7685/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=1,475,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7686/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,475,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7687/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,475,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7688/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,476,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7689/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,476,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7690/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,476,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7691/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,476,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7692/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,476,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7693/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,477,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7694/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,477,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7695/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,477,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7696/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,477,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7697/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,477,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7698/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,478,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7699/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,478,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7700/500000]
+ optim/total_grad_norm=1.198
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,478,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7701/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,478,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7702/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,478,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7703/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,478,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7704/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,479,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7705/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,479,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7706/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,479,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7707/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,479,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7708/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,479,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7709/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,480,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7710/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,480,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7711/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,480,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7712/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=1,480,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7713/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,480,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7714/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,481,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7715/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,481,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7716/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,481,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7717/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,481,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7718/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,481,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7719/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,482,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7720/500000]
+ optim/total_grad_norm=1.690
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,482,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7721/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,482,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7722/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,482,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7723/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,482,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7724/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,483,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7725/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,483,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7726/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,483,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7727/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,483,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7728/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,483,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7729/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=1,483,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7730/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,484,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7731/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,484,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7732/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,484,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7733/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,484,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7734/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,484,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7735/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=1,485,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7736/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,485,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7737/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,485,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7738/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,485,696,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7739/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,485,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7740/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=1,486,080,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7741/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,486,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7742/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,486,464,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7743/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,486,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7744/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=1,486,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7745/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,487,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7746/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,487,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7747/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,487,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7748/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,487,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7749/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,487,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7750/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,488,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7751/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,488,192,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=7752/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,488,384,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=7753/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,488,576,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=7754/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,488,768,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7755/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,488,960,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7756/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=1,489,152,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7757/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,489,344,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7758/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,489,536,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7759/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,489,728,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7760/500000]
+ optim/total_grad_norm=1.302
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,489,920,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+ System/Peak GPU Memory (MB)=46,467
+[step=7761/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,490,112,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7762/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,490,304,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=7763/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,490,496,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7764/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,490,688,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7765/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,490,880,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7766/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,491,072,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7767/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,491,264,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7768/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,491,456,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7769/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,491,648,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=7770/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,491,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7771/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,492,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7772/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,492,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7773/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,492,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7774/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,492,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7775/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,492,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7776/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,492,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7777/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,493,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7778/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,493,376,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7779/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,493,568,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7780/500000]
+ optim/total_grad_norm=1.602
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,493,760,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7781/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,493,952,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7782/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,494,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7783/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,494,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7784/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,494,528,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7785/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,494,720,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7786/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=1,494,912,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7787/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=1,495,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7788/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,495,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7789/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=1,495,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7790/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,495,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7791/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,495,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7792/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,496,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7793/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,496,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7794/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,496,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7795/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,496,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7796/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,496,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7797/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,497,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7798/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,497,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7799/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,497,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7800/500000]
+ optim/total_grad_norm=1.213
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,497,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7801/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,497,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7802/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,497,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7803/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,498,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7804/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,498,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7805/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,498,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7806/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,498,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7807/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,498,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7808/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,499,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7809/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,499,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7810/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,499,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7811/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,499,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7812/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=1,499,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7813/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,500,096,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7814/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,500,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7815/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,500,480,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7816/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,500,672,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7817/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,500,864,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7818/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,501,056,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7819/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,501,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7820/500000]
+ optim/total_grad_norm=1.191
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,501,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7821/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=1,501,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7822/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,501,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7823/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,502,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7824/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,502,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7825/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,502,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7826/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,502,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7827/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,502,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7828/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,502,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7829/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,503,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7830/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,503,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7831/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,503,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7832/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,503,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7833/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=1,503,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7834/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,504,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7835/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,504,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7836/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,504,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7837/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,504,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7838/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,504,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7839/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,505,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7840/500000]
+ optim/total_grad_norm=1.515
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,505,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7841/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,505,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7842/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,505,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7843/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,505,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7844/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,506,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7845/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,506,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7846/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,506,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7847/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,506,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7848/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,506,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7849/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,507,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7850/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,507,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7851/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,507,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7852/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,507,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7853/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=1,507,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7854/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,507,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7855/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,508,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7856/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,508,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7857/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,508,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7858/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,508,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7859/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,508,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7860/500000]
+ optim/total_grad_norm=1.396
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,509,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7861/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,509,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7862/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,509,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7863/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,509,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7864/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,509,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7865/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,510,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7866/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,510,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7867/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,510,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7868/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,510,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7869/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,510,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7870/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,511,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7871/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,511,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7872/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,511,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7873/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,511,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7874/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,511,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7875/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,512,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7876/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,512,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7877/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,512,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7878/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,512,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7879/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,512,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7880/500000]
+ optim/total_grad_norm=1.303
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,512,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7881/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,513,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7882/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,513,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7883/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,513,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7884/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,513,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7885/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,513,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7886/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=1,514,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7887/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,514,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7888/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,514,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7889/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=1,514,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7890/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,514,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7891/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,515,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7892/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=1,515,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7893/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,515,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7894/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,515,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7895/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,515,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7896/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,516,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7897/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=1,516,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7898/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,516,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7899/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,516,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7900/500000]
+ optim/total_grad_norm=1.496
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,516,800,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7901/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,516,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7902/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,517,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7903/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=1,517,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7904/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=1,517,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7905/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,517,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7906/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,517,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7907/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,518,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7908/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,518,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=7909/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,518,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7910/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,518,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7911/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,518,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7912/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,519,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7913/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,519,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7914/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,519,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7915/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,519,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7916/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,519,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7917/500000]
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=1,520,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7918/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,520,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7919/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,520,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7920/500000]
+ optim/total_grad_norm=1.125
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,520,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=7921/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,520,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7922/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,521,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=7923/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,521,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=7924/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,521,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7925/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,521,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7926/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=1,521,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7927/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,521,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7928/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,522,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7929/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=1,522,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7930/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,522,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7931/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,522,752,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7932/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,522,944,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7933/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,523,136,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7934/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,523,328,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7935/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,523,520,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7936/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,523,712,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7937/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,523,904,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7938/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,524,096,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7939/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,524,288,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7940/500000]
+ optim/total_grad_norm=1.510
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,524,480,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7941/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,524,672,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7942/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,524,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7943/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,525,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7944/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,525,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7945/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,525,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7946/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,525,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7947/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,525,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7948/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,526,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7949/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,526,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7950/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,526,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7951/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,526,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7952/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,526,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7953/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,526,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7954/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,527,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7955/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,527,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7956/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,527,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7957/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,527,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7958/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,527,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7959/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,528,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7960/500000]
+ optim/total_grad_norm=1.128
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=1,528,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7961/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,528,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7962/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,528,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7963/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,528,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7964/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,529,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7965/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,529,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7966/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=1,529,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7967/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,529,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7968/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,529,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7969/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,530,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7970/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,530,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7971/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,530,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7972/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,530,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7973/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,530,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7974/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,531,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7975/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,531,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7976/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,531,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7977/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,531,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7978/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,531,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7979/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,531,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7980/500000]
+ optim/total_grad_norm=1.370
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,532,160,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7981/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,532,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7982/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,532,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7983/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,532,736,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7984/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,532,928,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7985/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,533,120,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7986/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,533,312,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7987/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,533,504,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7988/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,533,696,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7989/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,533,888,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7990/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,534,080,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=7991/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,534,272,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7992/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,534,464,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7993/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,534,656,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7994/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,534,848,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7995/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,535,040,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7996/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,535,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7997/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,535,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7998/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,535,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7999/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,535,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8000/500000]
+ optim/total_grad_norm=1.406
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,536,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [15:56:49] INFO | >> Saving config... checkpoint.py:608
+10/04 [15:57:38] INFO | >> Saving model state... checkpoint.py:796
+10/04 [15:58:52] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [16:00:25] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8001/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,536,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8002/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,536,384,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=8003/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,536,576,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=8004/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,536,768,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=8005/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,536,960,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=8006/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,537,152,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=8007/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,537,344,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=8008/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,537,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8009/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,537,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8010/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=1,537,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8011/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,538,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8012/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,538,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8013/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,538,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8014/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,538,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8015/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,538,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8016/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,539,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8017/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,539,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8018/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,539,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8019/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,539,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8020/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,539,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8021/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,540,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8022/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,540,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8023/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,540,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8024/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,540,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8025/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,540,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8026/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,540,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8027/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,541,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8028/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,541,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8029/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,541,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8030/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,541,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8031/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,541,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8032/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,542,144,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8033/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,542,336,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8034/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,542,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8035/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,542,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8036/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,542,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8037/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,543,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8038/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,543,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8039/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,543,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8040/500000]
+ optim/total_grad_norm=1.762
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,543,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8041/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,543,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8042/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,544,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8043/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,544,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8044/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,544,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8045/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,544,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8046/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=1,544,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8047/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,545,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8048/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,545,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8049/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,545,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8050/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,545,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8051/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,545,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8052/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,545,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8053/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,546,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8054/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,546,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8055/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,546,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8056/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=1,546,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8057/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,546,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8058/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,547,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8059/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,547,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8060/500000]
+ optim/total_grad_norm=1.394
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,547,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8061/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,547,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8062/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,547,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8063/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,548,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8064/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,548,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8065/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,548,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8066/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,548,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8067/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,548,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8068/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,549,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8069/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,549,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8070/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,549,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8071/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,549,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8072/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,549,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8073/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,550,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8074/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,550,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8075/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,550,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8076/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,550,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8077/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=1,550,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8078/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,550,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8079/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,551,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8080/500000]
+ optim/total_grad_norm=0.9972
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,551,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8081/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,551,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8082/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=1,551,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8083/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,551,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8084/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,552,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8085/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,552,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8086/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,552,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8087/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,552,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8088/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,552,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8089/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,553,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8090/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,553,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8091/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,553,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8092/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,553,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8093/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,553,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8094/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,554,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8095/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,554,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8096/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,554,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8097/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,554,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8098/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=1,554,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8099/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,555,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8100/500000]
+ optim/total_grad_norm=1.222
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,555,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8101/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,555,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8102/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,555,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8103/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,555,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8104/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,555,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8105/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,556,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8106/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,556,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8107/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,556,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8108/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,556,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8109/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=1,556,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8110/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,557,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8111/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,557,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8112/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,557,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8113/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,557,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8114/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,557,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8115/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,558,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8116/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=1,558,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8117/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,558,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8118/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,558,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8119/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,558,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8120/500000]
+ optim/total_grad_norm=1.394
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,559,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8121/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,559,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8122/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,559,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8123/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,559,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8124/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,559,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8125/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,560,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8126/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,560,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8127/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,560,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8128/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,560,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8129/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,560,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8130/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,560,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8131/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,561,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8132/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,561,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8133/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,561,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8134/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,561,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8135/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,561,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8136/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,562,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8137/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,562,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8138/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,562,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8139/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,562,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8140/500000]
+ optim/total_grad_norm=1.101
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,562,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8141/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,563,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8142/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,563,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8143/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,563,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8144/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=1,563,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8145/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,563,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8146/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,564,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8147/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,564,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8148/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,564,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8149/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,564,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8150/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,564,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8151/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,564,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8152/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=1,565,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8153/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,565,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8154/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,565,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8155/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,565,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8156/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,565,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8157/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=1,566,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8158/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,566,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8159/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,566,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8160/500000]
+ optim/total_grad_norm=1.790
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=1,566,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8161/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,566,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8162/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,567,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8163/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,567,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8164/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,567,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8165/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,567,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8166/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,567,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8167/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,568,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8168/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,568,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8169/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,568,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8170/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,568,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8171/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,568,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8172/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,569,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8173/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=1,569,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8174/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,569,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8175/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,569,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8176/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,569,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8177/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,569,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8178/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,570,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8179/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,570,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8180/500000]
+ optim/total_grad_norm=1.202
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,570,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8181/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,570,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8182/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,570,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8183/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,571,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8184/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=1,571,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8185/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,571,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8186/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,571,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8187/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,571,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8188/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,572,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8189/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,572,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8190/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,572,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8191/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,572,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8192/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,572,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8193/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,573,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8194/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,573,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8195/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,573,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8196/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,573,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8197/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,573,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8198/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,574,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8199/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,574,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8200/500000]
+ optim/total_grad_norm=1.197
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,574,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8201/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,574,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8202/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,574,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8203/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,574,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8204/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,575,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8205/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,575,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8206/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,575,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8207/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,575,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8208/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,575,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8209/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,576,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8210/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,576,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8211/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,576,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8212/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,576,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8213/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,576,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8214/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,577,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8215/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,577,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8216/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,577,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8217/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,577,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8218/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,577,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8219/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,578,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8220/500000]
+ optim/total_grad_norm=1.196
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,578,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8221/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,578,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8222/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,578,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8223/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,578,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8224/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=1,579,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8225/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,579,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8226/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,579,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8227/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,579,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8228/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,579,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8229/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,579,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8230/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,580,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8231/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,580,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8232/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,580,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8233/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,580,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8234/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,580,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8235/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,581,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8236/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,581,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8237/500000]
+ train/ActionNoiseL2Loss=0.1746
+ throughput/total_tokens=1,581,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8238/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,581,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8239/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,581,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8240/500000]
+ optim/total_grad_norm=1.557
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,582,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8241/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,582,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8242/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,582,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8243/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,582,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8244/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,582,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8245/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,583,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8246/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,583,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8247/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,583,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8248/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,583,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8249/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,583,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8250/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=1,584,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8251/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,584,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8252/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,584,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8253/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,584,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8254/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,584,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8255/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,584,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8256/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,585,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8257/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,585,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8258/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,585,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8259/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,585,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8260/500000]
+ optim/total_grad_norm=1.093
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,585,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8261/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,586,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8262/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,586,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8263/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,586,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8264/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,586,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8265/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,586,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8266/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,587,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8267/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,587,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8268/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,587,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8269/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,587,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8270/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,587,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8271/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,588,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8272/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,588,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8273/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,588,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8274/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,588,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8275/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,588,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8276/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,588,992,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8277/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,589,184,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8278/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,589,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8279/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,589,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8280/500000]
+ optim/total_grad_norm=0.7780
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,589,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8281/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,589,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8282/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=1,590,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8283/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,590,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8284/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,590,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8285/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,590,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8286/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,590,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8287/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,591,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8288/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,591,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8289/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,591,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8290/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=1,591,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8291/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,591,872,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8292/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,592,064,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8293/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,592,256,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8294/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,592,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8295/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,592,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8296/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,592,832,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8297/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,593,024,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8298/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,593,216,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8299/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,593,408,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8300/500000]
+ optim/total_grad_norm=1.346
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,593,600,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8301/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,593,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8302/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,593,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8303/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,594,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8304/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,594,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8305/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,594,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8306/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=1,594,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8307/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,594,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8308/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,595,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8309/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,595,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8310/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,595,520,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8311/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,595,712,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8312/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,595,904,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8313/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=1,596,096,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8314/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,596,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8315/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,596,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8316/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,596,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8317/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,596,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8318/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,597,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8319/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,597,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8320/500000]
+ optim/total_grad_norm=1.671
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,597,440,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8321/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,597,632,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8322/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,597,824,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8323/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,598,016,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8324/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,598,208,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8325/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,598,400,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8326/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,598,592,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8327/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,598,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8328/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,598,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8329/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,599,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8330/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,599,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8331/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,599,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8332/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,599,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8333/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,599,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8334/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,600,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8335/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,600,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8336/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,600,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8337/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,600,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8338/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,600,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8339/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,601,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8340/500000]
+ optim/total_grad_norm=1.104
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,601,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8341/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,601,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8342/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,601,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8343/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,601,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8344/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,602,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8345/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=1,602,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8346/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,602,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8347/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,602,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8348/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,602,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8349/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,603,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8350/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,603,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8351/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,603,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8352/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,603,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8353/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=1,603,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8354/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,603,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8355/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,604,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8356/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,604,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8357/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,604,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8358/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,604,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8359/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,604,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8360/500000]
+ optim/total_grad_norm=1.586
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=1,605,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8361/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,605,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8362/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,605,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8363/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,605,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8364/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,605,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8365/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,606,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8366/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,606,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8367/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,606,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8368/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,606,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8369/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,606,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8370/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,607,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8371/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,607,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8372/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=1,607,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8373/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=1,607,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8374/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=1,607,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8375/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,608,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8376/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,608,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8377/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,608,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8378/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,608,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8379/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=1,608,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8380/500000]
+ optim/total_grad_norm=1.603
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,608,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8381/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,609,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8382/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,609,344,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8383/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,609,536,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8384/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,609,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8385/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,609,920,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8386/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=1,610,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8387/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,610,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8388/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,610,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8389/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,610,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8390/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=1,610,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8391/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,611,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8392/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,611,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8393/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,611,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8394/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,611,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8395/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,611,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8396/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,612,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8397/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,612,224,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8398/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,612,416,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8399/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,612,608,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8400/500000]
+ optim/total_grad_norm=1.751
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=1,612,800,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8401/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,612,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8402/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,613,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8403/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,613,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8404/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,613,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8405/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,613,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8406/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,613,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8407/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,614,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8408/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,614,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8409/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=1,614,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8410/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,614,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8411/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,614,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8412/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,615,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8413/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,615,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8414/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,615,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8415/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,615,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8416/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,615,872,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8417/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,616,064,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8418/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,616,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8419/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,616,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8420/500000]
+ optim/total_grad_norm=0.9718
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,616,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8421/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,616,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8422/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,617,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8423/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,617,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8424/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,617,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8425/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,617,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8426/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,617,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8427/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,617,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8428/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,618,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8429/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,618,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8430/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,618,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8431/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,618,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8432/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,618,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8433/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,619,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8434/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,619,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8435/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,619,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8436/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,619,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8437/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,619,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8438/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=1,620,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8439/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,620,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8440/500000]
+ optim/total_grad_norm=1.272
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,620,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8441/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,620,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8442/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,620,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8443/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,621,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8444/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,621,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8445/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,621,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8446/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,621,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8447/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,621,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8448/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,622,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8449/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,622,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8450/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,622,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8451/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,622,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8452/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,622,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8453/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,622,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8454/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=1,623,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8455/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,623,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8456/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=1,623,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8457/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,623,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8458/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,623,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8459/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,624,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8460/500000]
+ optim/total_grad_norm=0.9842
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,624,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8461/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,624,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8462/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=1,624,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8463/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,624,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8464/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,625,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8465/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,625,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8466/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,625,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8467/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,625,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8468/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,625,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8469/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,626,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8470/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,626,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8471/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,626,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8472/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,626,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8473/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,626,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8474/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,627,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8475/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,627,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8476/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,627,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8477/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,627,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8478/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,627,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8479/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,627,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8480/500000]
+ optim/total_grad_norm=1.311
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,628,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8481/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,628,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8482/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,628,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8483/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,628,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8484/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,628,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8485/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,629,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8486/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,629,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8487/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,629,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8488/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,629,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8489/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,629,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8490/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,630,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8491/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,630,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8492/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,630,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8493/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,630,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8494/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,630,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8495/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,631,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8496/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,631,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8497/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,631,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8498/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,631,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8499/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=1,631,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8500/500000]
+ optim/total_grad_norm=1.411
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,632,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/04 [18:54:00] INFO | >> Saving config... checkpoint.py:608
+10/04 [18:54:41] INFO | >> Saving model state... checkpoint.py:796
+10/04 [18:55:55] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [18:57:29] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8501/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,632,192,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=8502/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,632,384,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=8503/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,632,576,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=8504/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,632,768,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=8505/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,632,960,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=8506/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,633,152,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=8507/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,633,344,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=8508/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,633,536,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=8509/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,633,728,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=8510/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,633,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8511/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,634,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8512/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,634,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8513/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,634,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8514/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,634,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8515/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,634,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8516/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,635,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8517/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,635,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8518/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,635,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8519/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,635,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8520/500000]
+ optim/total_grad_norm=1.137
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,635,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8521/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,636,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8522/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,636,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8523/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,636,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8524/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,636,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8525/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,636,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8526/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,636,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8527/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,637,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8528/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,637,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8529/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,637,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8530/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,637,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8531/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,637,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8532/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,638,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8533/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,638,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8534/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,638,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8535/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,638,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8536/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,638,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8537/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,639,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8538/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,639,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8539/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,639,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8540/500000]
+ optim/total_grad_norm=0.5842
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,639,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8541/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,639,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8542/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,640,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8543/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,640,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8544/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,640,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8545/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,640,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8546/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,640,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8547/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,641,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8548/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,641,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8549/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,641,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8550/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,641,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8551/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,641,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8552/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,641,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8553/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,642,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8554/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=1,642,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8555/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,642,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8556/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,642,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8557/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,642,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8558/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,643,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8559/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,643,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8560/500000]
+ optim/total_grad_norm=1.165
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,643,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8561/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,643,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8562/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,643,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8563/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,644,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8564/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,644,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8565/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,644,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8566/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,644,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8567/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,644,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8568/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,645,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8569/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,645,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8570/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,645,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8571/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,645,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8572/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,645,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8573/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,646,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8574/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,646,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8575/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=1,646,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8576/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,646,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8577/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,646,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8578/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,646,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8579/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,647,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8580/500000]
+ optim/total_grad_norm=1.167
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,647,360,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8581/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,647,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8582/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,647,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8583/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,647,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8584/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,648,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8585/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,648,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8586/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,648,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8587/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,648,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8588/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,648,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8589/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,649,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8590/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,649,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8591/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,649,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8592/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,649,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8593/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,649,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8594/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,650,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8595/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,650,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8596/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,650,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8597/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,650,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8598/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,650,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8599/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,651,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8600/500000]
+ optim/total_grad_norm=1.611
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,651,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8601/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,651,392,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8602/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,651,584,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8603/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,651,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8604/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,651,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8605/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,652,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8606/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,652,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8607/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,652,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8608/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,652,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8609/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,652,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8610/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=1,653,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8611/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,653,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8612/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,653,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8613/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,653,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8614/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,653,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8615/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,654,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8616/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,654,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8617/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,654,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8618/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,654,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8619/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,654,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8620/500000]
+ optim/total_grad_norm=1.978
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,655,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8621/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,655,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8622/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,655,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8623/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,655,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8624/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=1,655,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8625/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,656,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8626/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,656,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8627/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,656,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8628/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,656,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8629/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,656,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8630/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,656,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8631/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,657,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8632/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,657,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8633/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,657,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8634/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,657,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8635/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,657,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8636/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,658,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8637/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,658,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8638/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,658,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8639/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,658,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8640/500000]
+ optim/total_grad_norm=1.073
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,658,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8641/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,659,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8642/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,659,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8643/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,659,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8644/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,659,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8645/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,659,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8646/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,660,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8647/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,660,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8648/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,660,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8649/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=1,660,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8650/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,660,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8651/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,660,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8652/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=1,661,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8653/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,661,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8654/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,661,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8655/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,661,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8656/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,661,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8657/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,662,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8658/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,662,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8659/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,662,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8660/500000]
+ optim/total_grad_norm=1.655
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,662,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8661/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,662,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8662/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,663,104,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8663/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,663,296,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8664/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,663,488,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8665/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,663,680,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8666/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,663,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8667/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,664,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8668/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,664,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8669/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,664,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8670/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,664,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8671/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,664,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8672/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,665,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8673/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,665,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8674/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,665,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8675/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,665,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8676/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,665,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8677/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,665,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8678/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,666,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8679/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,666,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8680/500000]
+ optim/total_grad_norm=1.056
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,666,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8681/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=1,666,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8682/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,666,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8683/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,667,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8684/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,667,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8685/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,667,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8686/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,667,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8687/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,667,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8688/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=1,668,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8689/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,668,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8690/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,668,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8691/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,668,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8692/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,668,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8693/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,669,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8694/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,669,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8695/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,669,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8696/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,669,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8697/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,669,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8698/500000]
+ train/ActionNoiseL2Loss=0.1495
+ throughput/total_tokens=1,670,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8699/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,670,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8700/500000]
+ optim/total_grad_norm=1.493
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=1,670,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8701/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,670,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8702/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,670,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8703/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=1,670,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8704/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,671,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8705/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,671,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8706/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,671,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8707/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,671,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8708/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,671,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8709/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=1,672,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8710/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,672,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8711/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,672,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8712/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,672,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8713/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,672,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8714/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,673,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8715/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,673,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8716/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,673,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8717/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,673,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8718/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,673,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8719/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=1,674,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8720/500000]
+ optim/total_grad_norm=1.130
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,674,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8721/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,674,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8722/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,674,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8723/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,674,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8724/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,675,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8725/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,675,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8726/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,675,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8727/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,675,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8728/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,675,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8729/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,675,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8730/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=1,676,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8731/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,676,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8732/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,676,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8733/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,676,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8734/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,676,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8735/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,677,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8736/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,677,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8737/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,677,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8738/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,677,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8739/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,677,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8740/500000]
+ optim/total_grad_norm=1.339
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,678,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8741/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,678,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8742/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,678,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8743/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,678,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8744/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,678,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8745/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,679,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8746/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,679,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8747/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,679,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8748/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,679,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8749/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,679,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8750/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=1,680,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8751/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,680,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8752/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,680,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8753/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,680,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8754/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,680,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8755/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,680,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8756/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,681,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8757/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,681,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8758/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,681,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8759/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,681,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8760/500000]
+ optim/total_grad_norm=1.157
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,681,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8761/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,682,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8762/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,682,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8763/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,682,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8764/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,682,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8765/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,682,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8766/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,683,072,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8767/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,683,264,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8768/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,683,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8769/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,683,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8770/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,683,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8771/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,684,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8772/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,684,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8773/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,684,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8774/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,684,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8775/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,684,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8776/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,684,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8777/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,685,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8778/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,685,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8779/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,685,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8780/500000]
+ optim/total_grad_norm=1.614
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,685,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8781/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,685,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8782/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,686,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8783/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,686,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8784/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,686,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8785/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,686,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8786/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,686,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8787/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,687,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8788/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,687,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8789/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,687,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8790/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,687,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8791/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,687,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8792/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,688,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8793/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,688,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8794/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,688,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8795/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,688,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8796/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,688,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8797/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,689,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8798/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,689,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8799/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,689,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8800/500000]
+ optim/total_grad_norm=0.9311
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=1,689,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8801/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,689,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8802/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,689,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8803/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,690,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8804/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,690,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8805/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,690,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8806/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,690,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8807/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,690,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8808/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=1,691,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8809/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,691,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8810/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,691,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8811/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,691,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8812/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,691,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8813/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,692,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8814/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=1,692,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8815/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,692,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8816/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,692,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8817/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,692,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8818/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,693,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8819/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,693,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8820/500000]
+ optim/total_grad_norm=1.073
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,693,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8821/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,693,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8822/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,693,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8823/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=1,694,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8824/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,694,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8825/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=1,694,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8826/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,694,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8827/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,694,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8828/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,694,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8829/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,695,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8830/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,695,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8831/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,695,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8832/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=1,695,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8833/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=1,695,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8834/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,696,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8835/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=1,696,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8836/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,696,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8837/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,696,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8838/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=1,696,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8839/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,697,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8840/500000]
+ optim/total_grad_norm=2.082
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,697,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8841/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,697,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8842/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,697,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8843/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,697,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8844/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,698,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8845/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,698,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8846/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,698,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8847/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,698,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8848/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,698,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8849/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,699,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8850/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,699,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8851/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,699,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8852/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,699,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8853/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,699,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8854/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,699,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8855/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,700,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8856/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,700,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8857/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,700,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8858/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,700,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8859/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,700,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8860/500000]
+ optim/total_grad_norm=0.8753
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,701,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8861/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=1,701,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8862/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,701,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8863/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,701,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8864/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,701,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8865/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,702,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8866/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,702,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8867/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,702,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8868/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,702,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8869/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,702,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8870/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,703,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8871/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,703,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8872/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,703,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8873/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,703,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8874/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,703,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8875/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,704,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8876/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,704,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8877/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,704,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8878/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,704,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8879/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,704,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8880/500000]
+ optim/total_grad_norm=1.627
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,704,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8881/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,705,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8882/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,705,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8883/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,705,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8884/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=1,705,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8885/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,705,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8886/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,706,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8887/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,706,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8888/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,706,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8889/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,706,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8890/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,706,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8891/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,707,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8892/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,707,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8893/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,707,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8894/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,707,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8895/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,707,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8896/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,708,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8897/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,708,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8898/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,708,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8899/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,708,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8900/500000]
+ optim/total_grad_norm=1.761
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,708,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8901/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,708,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8902/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,709,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8903/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,709,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8904/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,709,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8905/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,709,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8906/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,709,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8907/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,710,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8908/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,710,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8909/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=1,710,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8910/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,710,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8911/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,710,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8912/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,711,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8913/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,711,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8914/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,711,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8915/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,711,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8916/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,711,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8917/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,712,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8918/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,712,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8919/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,712,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8920/500000]
+ optim/total_grad_norm=1.128
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,712,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8921/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,712,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8922/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,713,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8923/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,713,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8924/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,713,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8925/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,713,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8926/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,713,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8927/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,713,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8928/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,714,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8929/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,714,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8930/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,714,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8931/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,714,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8932/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,714,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8933/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,715,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8934/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,715,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8935/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,715,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8936/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,715,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8937/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,715,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8938/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,716,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8939/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,716,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8940/500000]
+ optim/total_grad_norm=1.357
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,716,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=8941/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=1,716,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8942/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,716,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8943/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,717,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8944/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,717,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8945/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,717,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8946/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,717,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8947/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,717,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8948/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,718,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8949/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,718,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8950/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,718,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8951/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,718,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8952/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,718,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8953/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,718,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8954/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,719,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8955/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,719,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8956/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,719,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8957/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,719,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8958/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,719,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8959/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,720,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8960/500000]
+ optim/total_grad_norm=1.118
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,720,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8961/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,720,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8962/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,720,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8963/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,720,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8964/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,721,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8965/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,721,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8966/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,721,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8967/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,721,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8968/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,721,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8969/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,722,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8970/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,722,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8971/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,722,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8972/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,722,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8973/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,722,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8974/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,723,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8975/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,723,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8976/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,723,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8977/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,723,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8978/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,723,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8979/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,723,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8980/500000]
+ optim/total_grad_norm=2.026
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,724,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8981/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,724,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8982/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,724,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8983/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,724,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8984/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,724,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8985/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,725,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8986/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,725,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8987/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,725,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8988/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,725,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8989/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,725,888,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8990/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,726,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=8991/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,726,272,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8992/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,726,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8993/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,726,656,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8994/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,726,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8995/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,727,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8996/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=1,727,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8997/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,727,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8998/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=1,727,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8999/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,727,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9000/500000]
+ optim/total_grad_norm=1.011
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,728,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/04 [21:51:16] INFO | >> Saving config... checkpoint.py:608
+10/04 [21:51:50] INFO | >> Saving model state... checkpoint.py:796
+10/04 [21:53:03] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [21:54:37] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9001/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,728,192,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=9002/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,728,384,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=9003/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,728,576,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=9004/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,728,768,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=9005/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,728,960,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=9006/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,729,152,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=9007/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,729,344,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9008/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,729,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9009/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,729,728,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9010/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,729,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=9011/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,730,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9012/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,730,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9013/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,730,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9014/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,730,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9015/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,730,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9016/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,731,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9017/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,731,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9018/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,731,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9019/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=1,731,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9020/500000]
+ optim/total_grad_norm=1.702
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,731,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9021/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,732,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9022/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,732,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9023/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,732,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9024/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,732,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9025/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,732,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9026/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,732,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9027/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,733,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9028/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,733,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9029/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,733,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9030/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,733,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9031/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,733,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9032/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,734,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9033/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,734,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9034/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,734,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9035/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,734,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9036/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=1,734,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9037/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,735,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9038/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,735,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9039/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,735,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9040/500000]
+ optim/total_grad_norm=0.8301
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,735,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9041/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,735,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9042/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,736,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9043/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=1,736,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9044/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,736,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9045/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,736,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9046/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,736,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9047/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,737,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9048/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,737,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9049/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,737,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9050/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,737,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9051/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=1,737,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9052/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,737,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9053/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,738,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9054/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,738,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9055/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,738,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9056/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,738,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9057/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,738,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9058/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,739,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9059/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,739,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9060/500000]
+ optim/total_grad_norm=0.8552
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,739,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9061/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,739,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9062/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,739,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9063/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,740,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9064/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,740,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9065/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,740,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9066/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,740,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9067/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=1,740,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9068/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,741,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9069/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,741,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9070/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,741,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9071/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,741,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9072/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,741,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9073/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,742,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9074/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,742,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9075/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,742,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9076/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,742,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9077/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,742,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9078/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,742,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9079/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,743,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9080/500000]
+ optim/total_grad_norm=0.8798
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,743,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9081/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,743,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9082/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,743,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9083/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,743,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9084/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,744,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9085/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,744,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9086/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,744,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9087/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,744,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9088/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,744,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9089/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,745,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9090/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,745,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9091/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,745,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9092/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=1,745,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9093/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,745,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9094/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,746,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9095/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,746,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9096/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,746,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9097/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,746,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9098/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,746,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9099/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,747,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9100/500000]
+ optim/total_grad_norm=1.383
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,747,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9101/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,747,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9102/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,747,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9103/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,747,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9104/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,747,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9105/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,748,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9106/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,748,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9107/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,748,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9108/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,748,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9109/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,748,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9110/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,749,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9111/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,749,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9112/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,749,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9113/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,749,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9114/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=1,749,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9115/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,750,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9116/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,750,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9117/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,750,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9118/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,750,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9119/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,750,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9120/500000]
+ optim/total_grad_norm=1.394
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,751,040,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9121/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,751,232,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9122/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,751,424,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9123/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,751,616,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9124/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,751,808,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9125/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,752,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9126/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,752,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9127/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,752,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9128/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,752,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9129/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,752,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9130/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,752,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9131/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,753,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9132/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,753,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9133/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,753,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9134/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,753,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9135/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,753,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9136/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,754,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9137/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,754,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9138/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,754,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9139/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,754,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9140/500000]
+ optim/total_grad_norm=1.342
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,754,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9141/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,755,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9142/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=1,755,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9143/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,755,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9144/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,755,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9145/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,755,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9146/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,756,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9147/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,756,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9148/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,756,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9149/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,756,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9150/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,756,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9151/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,756,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9152/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,757,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9153/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,757,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9154/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,757,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9155/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,757,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9156/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=1,757,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9157/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,758,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9158/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,758,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9159/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,758,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9160/500000]
+ optim/total_grad_norm=1.200
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,758,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9161/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,758,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9162/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,759,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9163/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,759,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9164/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,759,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9165/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,759,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9166/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,759,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9167/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,760,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9168/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,760,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9169/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,760,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9170/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=1,760,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9171/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,760,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9172/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,761,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9173/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,761,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9174/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,761,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9175/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,761,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9176/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,761,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9177/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,761,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9178/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,762,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9179/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,762,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9180/500000]
+ optim/total_grad_norm=1.727
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,762,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9181/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,762,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9182/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,762,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9183/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,763,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9184/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,763,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9185/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,763,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9186/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,763,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9187/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,763,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9188/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,764,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9189/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,764,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9190/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,764,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9191/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,764,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9192/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,764,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9193/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,765,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9194/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,765,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9195/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,765,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9196/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,765,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9197/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,765,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9198/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,766,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9199/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,766,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9200/500000]
+ optim/total_grad_norm=1.294
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,766,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9201/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,766,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9202/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,766,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9203/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,766,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9204/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,767,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9205/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,767,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9206/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,767,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9207/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,767,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9208/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,767,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9209/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,768,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9210/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,768,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9211/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,768,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9212/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,768,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9213/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,768,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9214/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,769,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9215/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,769,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9216/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=1,769,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9217/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,769,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9218/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,769,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9219/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,770,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9220/500000]
+ optim/total_grad_norm=1.331
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,770,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9221/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,770,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9222/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,770,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9223/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,770,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9224/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,771,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9225/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,771,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9226/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=1,771,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9227/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,771,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9228/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,771,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9229/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,771,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9230/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,772,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9231/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,772,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9232/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,772,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9233/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,772,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9234/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,772,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9235/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,773,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9236/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,773,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9237/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,773,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9238/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,773,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9239/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,773,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9240/500000]
+ optim/total_grad_norm=1.385
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,774,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9241/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,774,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9242/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,774,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9243/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,774,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9244/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,774,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9245/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,775,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9246/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,775,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9247/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,775,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9248/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=1,775,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9249/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,775,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9250/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=1,776,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9251/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,776,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9252/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,776,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9253/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,776,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9254/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,776,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9255/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,776,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9256/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,777,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9257/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,777,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9258/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,777,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9259/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,777,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9260/500000]
+ optim/total_grad_norm=1.516
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,777,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9261/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,778,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9262/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,778,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9263/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,778,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9264/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,778,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9265/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,778,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9266/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,779,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9267/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,779,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9268/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=1,779,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9269/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,779,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9270/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,779,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9271/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=1,780,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9272/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,780,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9273/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,780,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9274/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,780,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9275/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=1,780,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9276/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,780,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9277/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,781,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9278/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,781,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9279/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,781,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9280/500000]
+ optim/total_grad_norm=2.031
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,781,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9281/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,781,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9282/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,782,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9283/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,782,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9284/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,782,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9285/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,782,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9286/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,782,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9287/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,783,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9288/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,783,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9289/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,783,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9290/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,783,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9291/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,783,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9292/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,784,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9293/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,784,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9294/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,784,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9295/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=1,784,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9296/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,784,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9297/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,785,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9298/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,785,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9299/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,785,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9300/500000]
+ optim/total_grad_norm=1.675
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,785,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9301/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,785,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9302/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,785,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9303/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,786,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9304/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,786,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9305/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,786,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9306/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=1,786,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9307/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,786,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9308/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,787,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9309/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,787,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9310/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,787,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9311/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,787,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9312/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,787,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9313/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,788,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9314/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,788,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9315/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,788,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9316/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,788,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9317/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=1,788,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9318/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,789,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9319/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,789,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9320/500000]
+ optim/total_grad_norm=1.211
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,789,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9321/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,789,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9322/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,789,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9323/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,790,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9324/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,790,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9325/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,790,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9326/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,790,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9327/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,790,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9328/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,790,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9329/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,791,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9330/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,791,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9331/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,791,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9332/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,791,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9333/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,791,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9334/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,792,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9335/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,792,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9336/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,792,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9337/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,792,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9338/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,792,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9339/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,793,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9340/500000]
+ optim/total_grad_norm=1.585
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=1,793,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9341/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,793,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9342/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,793,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9343/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,793,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9344/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,794,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9345/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,794,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9346/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,794,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9347/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,794,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9348/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,794,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9349/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=1,795,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9350/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,795,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9351/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,795,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9352/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,795,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9353/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,795,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9354/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,795,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9355/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,796,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9356/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,796,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9357/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=1,796,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9358/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,796,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9359/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,796,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9360/500000]
+ optim/total_grad_norm=1.036
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,797,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9361/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,797,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9362/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,797,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9363/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,797,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9364/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,797,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9365/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,798,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9366/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,798,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9367/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,798,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9368/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=1,798,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9369/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,798,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9370/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,799,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9371/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,799,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9372/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,799,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9373/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,799,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9374/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=1,799,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9375/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,800,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9376/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,800,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9377/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,800,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9378/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,800,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9379/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,800,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9380/500000]
+ optim/total_grad_norm=1.519
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,800,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9381/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,801,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9382/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,801,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9383/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,801,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9384/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,801,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9385/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,801,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9386/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,802,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9387/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,802,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9388/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,802,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9389/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,802,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9390/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,802,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9391/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,803,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9392/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,803,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9393/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=1,803,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9394/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,803,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9395/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=1,803,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9396/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,804,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9397/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,804,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9398/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,804,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9399/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,804,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9400/500000]
+ optim/total_grad_norm=0.9744
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,804,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9401/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,804,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9402/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,805,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9403/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,805,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9404/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,805,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9405/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,805,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9406/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,805,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9407/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,806,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9408/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,806,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9409/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,806,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9410/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,806,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9411/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,806,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9412/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,807,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9413/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,807,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9414/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,807,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9415/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,807,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9416/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,807,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9417/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,808,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9418/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,808,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9419/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,808,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9420/500000]
+ optim/total_grad_norm=1.383
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,808,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9421/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,808,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9422/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,809,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9423/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,809,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9424/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,809,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9425/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,809,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9426/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,809,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9427/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,809,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9428/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,810,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9429/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,810,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9430/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,810,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9431/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,810,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9432/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=1,810,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9433/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,811,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9434/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,811,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9435/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,811,520,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9436/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,811,712,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9437/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,811,904,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9438/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,812,096,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9439/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,812,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9440/500000]
+ optim/total_grad_norm=0.9151
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,812,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9441/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,812,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9442/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,812,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9443/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,813,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9444/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,813,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9445/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,813,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9446/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,813,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9447/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,813,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9448/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,814,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9449/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,814,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9450/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,814,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9451/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,814,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9452/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,814,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9453/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,814,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9454/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,815,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9455/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,815,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9456/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,815,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9457/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=1,815,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9458/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,815,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9459/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,816,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9460/500000]
+ optim/total_grad_norm=1.455
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,816,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9461/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,816,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9462/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,816,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9463/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,816,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9464/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,817,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9465/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,817,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9466/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,817,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9467/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,817,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9468/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,817,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9469/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,818,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9470/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,818,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9471/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,818,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9472/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,818,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9473/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,818,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9474/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,819,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9475/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,819,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9476/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,819,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9477/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,819,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9478/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,819,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9479/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,819,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9480/500000]
+ optim/total_grad_norm=1.004
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,820,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9481/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,820,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9482/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,820,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9483/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,820,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9484/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,820,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9485/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=1,821,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9486/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,821,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9487/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,821,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9488/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=1,821,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9489/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,821,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9490/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,822,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9491/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,822,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9492/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,822,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9493/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,822,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9494/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,822,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9495/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,823,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9496/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,823,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9497/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,823,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9498/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,823,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9499/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,823,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9500/500000]
+ optim/total_grad_norm=1.107
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,824,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/05 [00:48:30] INFO | >> Saving config... checkpoint.py:608
+10/05 [00:49:03] INFO | >> Saving model state... checkpoint.py:796
+10/05 [00:50:18] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [00:51:54] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9501/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=1,824,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=9502/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,824,384,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=9503/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,824,576,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=9504/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,824,768,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=9505/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=1,824,960,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=9506/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,825,152,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9507/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,825,344,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9508/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,825,536,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=9509/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=1,825,728,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=9510/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,825,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,467
+[step=9511/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,826,112,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=9512/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,826,304,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0485
+[step=9513/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,826,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9514/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,826,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9515/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,826,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9516/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,827,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9517/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,827,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9518/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,827,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9519/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,827,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9520/500000]
+ optim/total_grad_norm=1.203
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,827,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9521/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,828,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9522/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,828,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9523/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,828,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9524/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,828,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9525/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,828,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9526/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,828,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9527/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,829,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9528/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,829,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9529/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=1,829,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9530/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,829,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9531/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,829,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9532/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=1,830,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9533/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,830,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9534/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,830,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9535/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,830,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9536/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,830,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9537/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,831,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9538/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,831,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9539/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,831,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9540/500000]
+ optim/total_grad_norm=1.434
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,831,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9541/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,831,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9542/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,832,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9543/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,832,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9544/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,832,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9545/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,832,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9546/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,832,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9547/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,833,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9548/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,833,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9549/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,833,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9550/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,833,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9551/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,833,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9552/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,833,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9553/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,834,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9554/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,834,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9555/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,834,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9556/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,834,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9557/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,834,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9558/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,835,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9559/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,835,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9560/500000]
+ optim/total_grad_norm=1.554
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,835,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9561/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,835,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9562/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,835,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9563/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,836,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9564/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,836,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9565/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,836,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9566/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,836,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9567/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,836,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9568/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,837,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9569/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,837,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9570/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,837,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9571/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,837,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9572/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,837,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9573/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,838,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9574/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,838,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9575/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,838,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9576/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,838,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9577/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,838,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9578/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,838,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9579/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,839,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9580/500000]
+ optim/total_grad_norm=1.079
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,839,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9581/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,839,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9582/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,839,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9583/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,839,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9584/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,840,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9585/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,840,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9586/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,840,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9587/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,840,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9588/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,840,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9589/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,841,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9590/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,841,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9591/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,841,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9592/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,841,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9593/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,841,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9594/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,842,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9595/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,842,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9596/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,842,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9597/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,842,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9598/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,842,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9599/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,843,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9600/500000]
+ optim/total_grad_norm=1.182
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,843,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9601/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,843,392,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9602/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,843,584,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9603/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,843,776,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9604/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,843,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9605/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,844,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9606/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,844,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9607/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,844,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9608/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=1,844,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9609/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,844,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9610/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,845,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,467
+[step=9611/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,845,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9612/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,845,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9613/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,845,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9614/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,845,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9615/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,846,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9616/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=1,846,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9617/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,846,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9618/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=1,846,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9619/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,846,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9620/500000]
+ optim/total_grad_norm=1.233
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,847,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9621/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=1,847,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9622/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,847,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9623/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,847,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9624/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,847,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9625/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,848,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9626/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,848,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9627/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,848,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9628/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,848,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9629/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,848,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9630/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,848,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9631/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,849,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9632/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,849,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9633/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,849,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9634/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,849,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9635/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,849,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9636/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,850,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9637/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,850,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9638/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=1,850,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9639/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,850,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9640/500000]
+ optim/total_grad_norm=1.386
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,850,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9641/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,851,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9642/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=1,851,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9643/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,851,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9644/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,851,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9645/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,851,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9646/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,852,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9647/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,852,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9648/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,852,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9649/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,852,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9650/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,852,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9651/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,852,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9652/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,853,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9653/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,853,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9654/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,853,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9655/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,853,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9656/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,853,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9657/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,854,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9658/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,854,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9659/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,854,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9660/500000]
+ optim/total_grad_norm=1.420
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,854,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9661/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,854,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9662/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,855,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9663/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,855,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9664/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,855,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9665/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,855,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9666/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,855,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9667/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=1,856,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9668/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,856,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9669/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,856,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9670/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,856,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9671/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,856,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9672/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,857,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9673/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,857,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9674/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,857,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9675/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,857,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9676/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,857,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9677/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,857,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9678/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,858,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9679/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,858,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9680/500000]
+ optim/total_grad_norm=1.355
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,858,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9681/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,858,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9682/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,858,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9683/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,859,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9684/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,859,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9685/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,859,520,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9686/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,859,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9687/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,859,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9688/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,860,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9689/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,860,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9690/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,860,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9691/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,860,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9692/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,860,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9693/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,861,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9694/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,861,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9695/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,861,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9696/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,861,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9697/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,861,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9698/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,862,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9699/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,862,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9700/500000]
+ optim/total_grad_norm=1.678
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=1,862,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9701/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,862,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9702/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,862,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9703/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,862,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9704/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,863,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9705/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,863,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9706/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,863,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9707/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,863,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9708/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,863,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9709/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,864,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9710/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,864,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9711/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,864,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9712/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=1,864,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9713/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,864,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9714/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,865,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9715/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,865,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9716/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,865,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9717/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,865,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9718/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,865,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9719/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,866,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9720/500000]
+ optim/total_grad_norm=0.8578
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,866,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9721/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,866,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9722/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,866,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9723/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,866,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9724/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,867,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9725/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,867,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9726/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,867,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9727/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,867,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9728/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,867,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9729/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,867,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9730/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,868,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9731/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,868,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9732/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,868,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9733/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,868,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9734/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,868,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9735/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,869,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9736/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,869,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9737/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,869,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9738/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,869,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9739/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,869,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9740/500000]
+ optim/total_grad_norm=1.391
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,870,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9741/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,870,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9742/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,870,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9743/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,870,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9744/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,870,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9745/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=1,871,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9746/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,871,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9747/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,871,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9748/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,871,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9749/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=1,871,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9750/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,872,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9751/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=1,872,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9752/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,872,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9753/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=1,872,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9754/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,872,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9755/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,872,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9756/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,873,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9757/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,873,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9758/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,873,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9759/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,873,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9760/500000]
+ optim/total_grad_norm=1.562
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,873,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9761/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,874,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9762/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,874,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9763/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,874,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9764/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,874,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9765/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,874,880,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9766/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,875,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=9767/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,875,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=9768/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,875,456,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9769/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,875,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9770/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,875,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9771/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,876,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9772/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,876,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9773/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,876,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9774/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,876,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9775/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,876,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9776/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,876,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9777/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,877,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9778/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,877,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9779/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,877,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9780/500000]
+ optim/total_grad_norm=1.165
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,877,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9781/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,877,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9782/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=1,878,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9783/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,878,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9784/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,878,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9785/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,878,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9786/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,878,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9787/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,879,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9788/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,879,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9789/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,879,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9790/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,879,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9791/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,879,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9792/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,880,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9793/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,880,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9794/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,880,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9795/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,880,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9796/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,880,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9797/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,881,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9798/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,881,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9799/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,881,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9800/500000]
+ optim/total_grad_norm=1.314
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,881,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9801/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,881,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9802/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,881,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9803/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,882,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9804/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,882,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9805/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,882,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9806/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,882,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9807/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,882,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9808/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,883,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9809/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,883,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9810/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,883,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9811/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,883,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9812/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,883,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9813/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,884,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9814/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,884,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9815/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,884,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9816/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,884,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9817/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,884,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9818/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,885,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9819/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,885,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9820/500000]
+ optim/total_grad_norm=1.191
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,885,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9821/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,885,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9822/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=1,885,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9823/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,886,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9824/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,886,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9825/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,886,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9826/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,886,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9827/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,886,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9828/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,886,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9829/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,887,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9830/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,887,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9831/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,887,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9832/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,887,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9833/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,887,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9834/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,888,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9835/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,888,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9836/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,888,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9837/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,888,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9838/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,888,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9839/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,889,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9840/500000]
+ optim/total_grad_norm=1.018
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,889,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9841/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,889,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9842/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,889,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9843/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,889,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9844/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,890,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9845/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,890,240,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9846/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,890,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9847/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,890,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9848/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,890,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9849/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,891,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9850/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,891,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9851/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,891,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9852/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,891,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9853/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,891,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9854/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,891,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9855/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,892,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9856/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,892,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9857/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,892,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9858/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,892,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9859/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,892,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9860/500000]
+ optim/total_grad_norm=1.178
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,893,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9861/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,893,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9862/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,893,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9863/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,893,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9864/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=1,893,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9865/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,894,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9866/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,894,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9867/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,894,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9868/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,894,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9869/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,894,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9870/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,895,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9871/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,895,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9872/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,895,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9873/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,895,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9874/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,895,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9875/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,896,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9876/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,896,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9877/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,896,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9878/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,896,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9879/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,896,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9880/500000]
+ optim/total_grad_norm=1.326
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,896,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9881/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,897,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9882/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,897,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9883/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,897,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9884/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,897,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9885/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,897,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9886/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,898,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9887/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,898,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9888/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,898,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9889/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,898,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9890/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,898,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9891/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,899,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=9892/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,899,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9893/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,899,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9894/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,899,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9895/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,899,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9896/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,900,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9897/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,900,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9898/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,900,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9899/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,900,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9900/500000]
+ optim/total_grad_norm=0.8194
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,900,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9901/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,900,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9902/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,901,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9903/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,901,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9904/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,901,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9905/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,901,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9906/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,901,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9907/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,902,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9908/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,902,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9909/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,902,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9910/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,902,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9911/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,902,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9912/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,903,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9913/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,903,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9914/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,903,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9915/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,903,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9916/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,903,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9917/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,904,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9918/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,904,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9919/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,904,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9920/500000]
+ optim/total_grad_norm=0.7749
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,904,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9921/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,904,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9922/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,905,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9923/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,905,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9924/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,905,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9925/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,905,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9926/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,905,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9927/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,905,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9928/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,906,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9929/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,906,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9930/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,906,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9931/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,906,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9932/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,906,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9933/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,907,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9934/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,907,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9935/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,907,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9936/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,907,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9937/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,907,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9938/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,908,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9939/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,908,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9940/500000]
+ optim/total_grad_norm=1.402
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=1,908,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9941/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,908,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9942/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,908,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9943/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,909,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9944/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,909,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9945/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,909,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9946/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,909,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9947/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,909,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9948/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,910,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9949/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,910,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9950/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,910,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9951/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,910,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9952/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,910,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9953/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,910,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9954/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,911,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9955/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,911,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9956/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,911,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9957/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,911,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9958/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,911,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9959/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,912,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9960/500000]
+ optim/total_grad_norm=1.622
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,912,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9961/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,912,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9962/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,912,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9963/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,912,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9964/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,913,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9965/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,913,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9966/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=1,913,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9967/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,913,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9968/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,913,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9969/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,914,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9970/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,914,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9971/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,914,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9972/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,914,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9973/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,914,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9974/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,915,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9975/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,915,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9976/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,915,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9977/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,915,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9978/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,915,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9979/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,915,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9980/500000]
+ optim/total_grad_norm=1.016
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,916,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=9981/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,916,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9982/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,916,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9983/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,916,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9984/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,916,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9985/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,917,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9986/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,917,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9987/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,917,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9988/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,917,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9989/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,917,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9990/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,918,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=9991/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,918,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9992/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,918,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9993/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,918,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9994/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,918,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9995/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,919,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9996/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,919,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9997/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,919,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9998/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,919,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=9999/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=1,919,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10000/500000]
+ optim/total_grad_norm=1.592
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,920,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/05 [03:45:40] INFO | >> Saving config... checkpoint.py:608
+10/05 [03:46:42] INFO | >> Saving model state... checkpoint.py:796
+10/05 [03:47:52] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [03:49:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10001/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,920,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10002/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,920,384,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=10003/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,920,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=10004/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,920,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10005/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,920,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10006/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,921,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10007/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,921,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10008/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,921,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10009/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,921,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10010/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,921,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10011/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,922,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10012/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,922,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10013/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,922,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10014/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,922,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10015/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,922,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10016/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,923,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10017/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,923,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10018/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,923,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10019/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,923,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10020/500000]
+ optim/total_grad_norm=1.344
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,923,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10021/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,924,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10022/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,924,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10023/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=1,924,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10024/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,924,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10025/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,924,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10026/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,924,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10027/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,925,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10028/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,925,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10029/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,925,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10030/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,925,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10031/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,925,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10032/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,926,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10033/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,926,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10034/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=1,926,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10035/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,926,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10036/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,926,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10037/500000]
+ train/ActionNoiseL2Loss=0.1566
+ throughput/total_tokens=1,927,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10038/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,927,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10039/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,927,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10040/500000]
+ optim/total_grad_norm=0.7428
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,927,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10041/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,927,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10042/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,928,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10043/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,928,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10044/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,928,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10045/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,928,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10046/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,928,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10047/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,929,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10048/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,929,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10049/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,929,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10050/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,929,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10051/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,929,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10052/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,929,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10053/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,930,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10054/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,930,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10055/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,930,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10056/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,930,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10057/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,930,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10058/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,931,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10059/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,931,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10060/500000]
+ optim/total_grad_norm=1.041
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,931,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10061/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=1,931,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10062/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,931,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10063/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,932,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10064/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,932,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10065/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,932,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10066/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,932,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10067/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,932,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10068/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,933,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10069/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=1,933,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10070/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,933,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10071/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,933,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10072/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,933,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10073/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,934,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10074/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,934,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10075/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,934,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10076/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,934,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10077/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,934,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10078/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,934,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10079/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,935,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10080/500000]
+ optim/total_grad_norm=1.652
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,935,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10081/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,935,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10082/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,935,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10083/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,935,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10084/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,936,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10085/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,936,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10086/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,936,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10087/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,936,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10088/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,936,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10089/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,937,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10090/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,937,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10091/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,937,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10092/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,937,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10093/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,937,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10094/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,938,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10095/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,938,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10096/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,938,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10097/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,938,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10098/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,938,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10099/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,939,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10100/500000]
+ optim/total_grad_norm=1.293
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,939,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10101/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,939,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10102/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,939,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10103/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,939,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10104/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,939,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10105/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,940,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10106/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,940,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10107/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,940,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10108/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,940,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10109/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,940,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10110/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,941,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10111/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,941,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10112/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,941,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10113/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,941,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10114/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,941,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10115/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,942,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10116/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,942,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10117/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=1,942,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10118/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,942,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10119/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,942,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10120/500000]
+ optim/total_grad_norm=1.759
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,943,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10121/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,943,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10122/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,943,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10123/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,943,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10124/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,943,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10125/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,944,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10126/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,944,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10127/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,944,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10128/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,944,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10129/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,944,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10130/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,944,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10131/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,945,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10132/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,945,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10133/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,945,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10134/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,945,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10135/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,945,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10136/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,946,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10137/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,946,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10138/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,946,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10139/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,946,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10140/500000]
+ optim/total_grad_norm=1.118
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,946,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10141/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,947,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10142/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,947,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10143/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,947,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10144/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,947,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10145/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,947,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10146/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,948,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10147/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,948,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10148/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,948,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10149/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,948,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10150/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,948,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10151/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,948,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10152/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=1,949,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10153/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,949,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10154/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,949,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10155/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,949,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10156/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,949,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10157/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,950,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10158/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,950,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10159/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,950,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10160/500000]
+ optim/total_grad_norm=1.393
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,950,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10161/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,950,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10162/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,951,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10163/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,951,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10164/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,951,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10165/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,951,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10166/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,951,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10167/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,952,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10168/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,952,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10169/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,952,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10170/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,952,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10171/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,952,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10172/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,953,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10173/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,953,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10174/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,953,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10175/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,953,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10176/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,953,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10177/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,953,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10178/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=1,954,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10179/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,954,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10180/500000]
+ optim/total_grad_norm=1.522
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,954,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10181/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,954,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10182/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,954,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10183/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,955,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10184/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,955,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10185/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,955,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10186/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,955,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10187/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,955,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10188/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,956,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10189/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,956,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10190/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,956,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10191/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,956,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10192/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,956,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10193/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,957,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10194/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,957,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10195/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,957,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10196/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,957,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10197/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,957,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10198/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,958,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10199/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,958,208,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10200/500000]
+ optim/total_grad_norm=1.499
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,958,400,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10201/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,958,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10202/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,958,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10203/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,958,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10204/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,959,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10205/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,959,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10206/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,959,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10207/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,959,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10208/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=1,959,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10209/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,960,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10210/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,960,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10211/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,960,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10212/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,960,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10213/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,960,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10214/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,961,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10215/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,961,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10216/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,961,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10217/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,961,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10218/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,961,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10219/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,962,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10220/500000]
+ optim/total_grad_norm=0.8313
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,962,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10221/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,962,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10222/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,962,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10223/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,962,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10224/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,963,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10225/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,963,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10226/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,963,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10227/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,963,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10228/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,963,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10229/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,963,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10230/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,964,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10231/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,964,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10232/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,964,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10233/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,964,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10234/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,964,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10235/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,965,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10236/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,965,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10237/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,965,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10238/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,965,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10239/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,965,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10240/500000]
+ optim/total_grad_norm=1.095
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,966,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10241/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,966,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10242/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,966,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10243/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,966,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10244/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,966,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10245/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,967,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10246/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,967,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10247/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,967,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10248/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,967,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10249/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,967,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10250/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,968,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10251/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,968,192,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10252/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,968,384,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10253/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,968,576,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10254/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,968,768,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10255/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,968,960,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10256/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,969,152,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10257/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,969,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10258/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,969,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10259/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,969,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10260/500000]
+ optim/total_grad_norm=1.123
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,969,920,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=46,467
+[step=10261/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,970,112,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10262/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,970,304,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10263/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,970,496,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10264/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,970,688,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10265/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=1,970,880,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10266/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,971,072,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10267/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,971,264,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10268/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,971,456,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10269/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,971,648,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10270/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,971,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10271/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,972,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10272/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,972,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10273/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,972,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10274/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,972,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10275/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,972,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10276/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,972,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10277/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,973,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10278/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,973,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10279/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,973,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10280/500000]
+ optim/total_grad_norm=1.187
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,973,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10281/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,973,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10282/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,974,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10283/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,974,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10284/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,974,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10285/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,974,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10286/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,974,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10287/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,975,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10288/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,975,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10289/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,975,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10290/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,975,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10291/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,975,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10292/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=1,976,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10293/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,976,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10294/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,976,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10295/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,976,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10296/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,976,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10297/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,977,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10298/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,977,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10299/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,977,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10300/500000]
+ optim/total_grad_norm=1.140
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,977,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10301/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,977,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10302/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,977,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10303/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=1,978,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10304/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,978,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10305/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,978,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10306/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,978,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10307/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,978,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10308/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=1,979,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10309/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,979,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10310/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,979,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10311/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,979,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10312/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,979,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10313/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,980,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10314/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,980,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10315/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,980,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10316/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,980,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10317/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,980,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10318/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,981,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10319/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,981,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10320/500000]
+ optim/total_grad_norm=1.498
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,981,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10321/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,981,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10322/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,981,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10323/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,982,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10324/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,982,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10325/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,982,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10326/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,982,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10327/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,982,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10328/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,982,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10329/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,983,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10330/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,983,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10331/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,983,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10332/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,983,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10333/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,983,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10334/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,984,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10335/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,984,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10336/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,984,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10337/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,984,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10338/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,984,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10339/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,985,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10340/500000]
+ optim/total_grad_norm=0.9109
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,985,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10341/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,985,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10342/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,985,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10343/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,985,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10344/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,986,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10345/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,986,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10346/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,986,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10347/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,986,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10348/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=1,986,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10349/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,987,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10350/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,987,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10351/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,987,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10352/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,987,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10353/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=1,987,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10354/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,987,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10355/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,988,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10356/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,988,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10357/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,988,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10358/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,988,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10359/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,988,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10360/500000]
+ optim/total_grad_norm=1.340
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,989,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10361/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,989,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10362/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,989,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10363/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,989,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10364/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,989,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10365/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,990,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10366/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,990,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10367/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,990,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10368/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,990,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10369/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,990,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10370/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,991,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10371/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,991,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10372/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=1,991,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10373/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,991,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10374/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,991,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10375/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,992,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10376/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,992,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10377/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,992,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10378/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,992,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10379/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,992,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10380/500000]
+ optim/total_grad_norm=1.652
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=1,992,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10381/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,993,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10382/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,993,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10383/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=1,993,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10384/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,993,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10385/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,993,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10386/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,994,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10387/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=1,994,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10388/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,994,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10389/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,994,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10390/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,994,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10391/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,995,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10392/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,995,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10393/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,995,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10394/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,995,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10395/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,995,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10396/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,996,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10397/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,996,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10398/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,996,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10399/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,996,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10400/500000]
+ optim/total_grad_norm=1.021
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,996,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10401/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,996,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10402/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,997,184,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10403/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,997,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10404/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,997,568,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10405/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,997,760,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10406/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,997,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10407/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,998,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10408/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,998,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10409/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,998,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10410/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,998,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10411/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,998,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10412/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,999,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10413/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,999,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10414/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,999,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10415/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,999,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10416/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,999,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10417/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,000,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10418/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,000,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10419/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,000,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=10420/500000]
+ optim/total_grad_norm=1.060
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=2,000,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10421/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,000,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10422/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=2,001,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10423/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,001,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10424/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,001,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10425/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=2,001,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10426/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,001,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10427/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,001,984,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10428/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=2,002,176,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10429/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,002,368,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10430/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,002,560,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10431/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,002,752,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10432/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,002,944,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10433/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=2,003,136,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10434/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,003,328,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10435/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,003,520,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10436/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,003,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10437/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,003,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10438/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,004,096,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10439/500000]
+ train/ActionNoiseL2Loss=0.1617
+ throughput/total_tokens=2,004,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10440/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,004,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10441/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,004,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10442/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,004,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10443/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,005,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10444/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,005,248,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10445/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,005,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10446/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,005,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10447/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=2,005,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10448/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,006,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10449/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,006,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10450/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=2,006,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10451/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=2,006,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10452/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,006,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10453/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,006,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10454/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=2,007,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10455/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=2,007,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10456/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,007,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10457/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,007,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10458/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,007,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10459/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,008,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10460/500000]
+ optim/total_grad_norm=1.450
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=2,008,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10461/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=2,008,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10462/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,008,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10463/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,008,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10464/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=2,009,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10465/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,009,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10466/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,009,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10467/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=2,009,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10468/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,009,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10469/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=2,010,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10470/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,010,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10471/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,010,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10472/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=2,010,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10473/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,010,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10474/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,011,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10475/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,011,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10476/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=2,011,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10477/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,011,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10478/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,011,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10479/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=2,011,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10480/500000]
+ optim/total_grad_norm=1.275
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,012,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10481/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,012,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10482/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,012,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10483/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,012,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10484/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,012,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10485/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,013,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10486/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,013,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10487/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,013,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10488/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,013,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10489/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,013,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10490/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=2,014,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10491/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,014,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10492/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=2,014,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10493/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=2,014,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10494/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,014,848,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10495/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,015,040,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10496/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,015,232,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10497/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,015,424,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10498/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,015,616,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10499/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,015,808,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10500/500000]
+ optim/total_grad_norm=1.468
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=2,016,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/05 [06:43:27] INFO | >> Saving config... checkpoint.py:608
+10/05 [06:44:12] INFO | >> Saving model state... checkpoint.py:796
+10/05 [06:45:26] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [06:47:02] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10501/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=2,016,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10502/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,016,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10503/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=2,016,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10504/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,016,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10505/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,016,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=10506/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,017,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10507/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,017,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10508/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=2,017,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10509/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,017,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10510/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,017,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10511/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,018,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10512/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,018,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10513/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,018,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=10514/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,018,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=10515/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,018,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=10516/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,019,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10517/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,019,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10518/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,019,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10519/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,019,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10520/500000]
+ optim/total_grad_norm=0.8856
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,019,840,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10521/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,020,032,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10522/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=2,020,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10523/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,020,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10524/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,020,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10525/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=2,020,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10526/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=2,020,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10527/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,021,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10528/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,021,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10529/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=2,021,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10530/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,021,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10531/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,021,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10532/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=2,022,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10533/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,022,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10534/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=2,022,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10535/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,022,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10536/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,022,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10537/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,023,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10538/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,023,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10539/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,023,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10540/500000]
+ optim/total_grad_norm=0.8485
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,023,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10541/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,023,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10542/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,024,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10543/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,024,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10544/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=2,024,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10545/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=2,024,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10546/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,024,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10547/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,025,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10548/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,025,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10549/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,025,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10550/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,025,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10551/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,025,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10552/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=2,025,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10553/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,026,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10554/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,026,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10555/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,026,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10556/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,026,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10557/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,026,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10558/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,027,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10559/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,027,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10560/500000]
+ optim/total_grad_norm=1.355
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,027,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10561/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,027,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10562/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,027,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10563/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=2,028,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10564/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,028,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10565/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,028,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10566/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,028,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10567/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,028,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10568/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,029,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10569/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,029,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10570/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,029,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10571/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=2,029,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10572/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,029,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10573/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,030,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10574/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=2,030,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10575/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,030,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10576/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,030,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10577/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=2,030,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10578/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,030,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10579/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=2,031,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10580/500000]
+ optim/total_grad_norm=1.673
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,031,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10581/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=2,031,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10582/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=2,031,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10583/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,031,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10584/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,032,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10585/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,032,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10586/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=2,032,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10587/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,032,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10588/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,032,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10589/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=2,033,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10590/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,033,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10591/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,033,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10592/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,033,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10593/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=2,033,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10594/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=2,034,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10595/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,034,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10596/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,034,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10597/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,034,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10598/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,034,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10599/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,035,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10600/500000]
+ optim/total_grad_norm=1.042
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,035,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10601/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=2,035,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10602/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,035,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10603/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,035,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10604/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,035,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10605/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,036,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10606/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=2,036,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10607/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,036,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10608/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,036,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10609/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,036,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10610/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,037,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10611/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=2,037,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10612/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,037,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10613/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=2,037,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10614/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,037,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10615/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,038,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10616/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=2,038,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10617/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,038,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10618/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,038,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10619/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,038,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10620/500000]
+ optim/total_grad_norm=1.232
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,039,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10621/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,039,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10622/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,039,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10623/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=2,039,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10624/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,039,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10625/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,040,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10626/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,040,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10627/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=2,040,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10628/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,040,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10629/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,040,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10630/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,040,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10631/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,041,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10632/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,041,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10633/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=2,041,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10634/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,041,728,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10635/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=2,041,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10636/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,042,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10637/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,042,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10638/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,042,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10639/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,042,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10640/500000]
+ optim/total_grad_norm=1.273
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,042,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10641/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,043,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10642/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,043,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10643/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,043,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10644/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,043,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10645/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,043,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10646/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=2,044,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10647/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,044,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10648/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,044,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10649/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,044,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10650/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=2,044,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10651/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,044,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10652/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,045,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10653/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=2,045,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10654/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,045,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10655/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=2,045,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10656/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,045,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10657/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=2,046,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10658/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,046,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10659/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=2,046,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10660/500000]
+ optim/total_grad_norm=1.031
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,046,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10661/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,046,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10662/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=2,047,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10663/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,047,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10664/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,047,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10665/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,047,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10666/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,047,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10667/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,048,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10668/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,048,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10669/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,048,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10670/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,048,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10671/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,048,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10672/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,049,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10673/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,049,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10674/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,049,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10675/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,049,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10676/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,049,792,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10677/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,049,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10678/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,050,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10679/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,050,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10680/500000]
+ optim/total_grad_norm=1.513
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=2,050,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10681/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=2,050,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10682/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,050,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10683/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=2,051,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10684/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,051,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10685/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,051,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10686/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=2,051,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10687/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,051,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10688/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,052,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10689/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,052,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10690/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,052,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10691/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,052,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10692/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,052,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10693/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,053,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10694/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,053,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10695/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=2,053,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10696/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,053,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10697/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,053,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10698/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=2,054,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10699/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,054,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10700/500000]
+ optim/total_grad_norm=1.258
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,054,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10701/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,054,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10702/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,054,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10703/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,054,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10704/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=2,055,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10705/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,055,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10706/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,055,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10707/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=2,055,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10708/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,055,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10709/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,056,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10710/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,056,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10711/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,056,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10712/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=2,056,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10713/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,056,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10714/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=2,057,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10715/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,057,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10716/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,057,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10717/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,057,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10718/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,057,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10719/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,058,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10720/500000]
+ optim/total_grad_norm=1.526
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,058,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10721/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,058,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10722/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=2,058,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10723/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=2,058,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10724/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,059,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10725/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,059,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10726/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,059,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10727/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,059,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10728/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=2,059,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10729/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,059,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10730/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,060,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10731/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=2,060,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10732/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=2,060,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10733/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,060,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10734/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,060,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10735/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,061,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10736/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=2,061,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10737/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,061,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10738/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=2,061,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10739/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=2,061,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10740/500000]
+ optim/total_grad_norm=1.387
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,062,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10741/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,062,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10742/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=2,062,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10743/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,062,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10744/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,062,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10745/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,063,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10746/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,063,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10747/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,063,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10748/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,063,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10749/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,063,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10750/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,064,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10751/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=2,064,192,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10752/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=2,064,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10753/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,064,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10754/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=2,064,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10755/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=2,064,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10756/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,065,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10757/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,065,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10758/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,065,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10759/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,065,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10760/500000]
+ optim/total_grad_norm=1.462
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=2,065,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10761/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=2,066,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10762/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,066,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10763/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,066,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10764/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,066,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10765/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,066,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10766/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,067,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10767/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,067,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10768/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,067,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10769/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,067,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10770/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,067,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10771/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,068,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10772/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=2,068,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10773/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=2,068,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10774/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,068,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10775/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=2,068,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10776/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,068,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10777/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,069,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10778/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=2,069,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10779/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,069,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10780/500000]
+ optim/total_grad_norm=1.371
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,069,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10781/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,069,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10782/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,070,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10783/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=2,070,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10784/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,070,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10785/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,070,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10786/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,070,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10787/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,071,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10788/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,071,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10789/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,071,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10790/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,071,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10791/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,071,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10792/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,072,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10793/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,072,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10794/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,072,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10795/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,072,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10796/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=2,072,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10797/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,073,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10798/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,073,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10799/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,073,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10800/500000]
+ optim/total_grad_norm=1.119
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,073,600,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10801/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,073,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10802/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,073,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10803/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,074,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10804/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,074,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10805/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,074,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10806/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,074,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10807/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,074,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10808/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=2,075,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10809/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,075,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10810/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,075,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10811/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,075,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10812/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,075,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10813/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,076,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10814/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=2,076,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10815/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,076,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10816/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,076,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10817/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,076,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10818/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,077,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10819/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,077,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10820/500000]
+ optim/total_grad_norm=0.9390
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,077,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10821/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,077,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10822/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,077,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10823/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,078,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10824/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=2,078,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10825/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,078,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10826/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,078,592,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10827/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,078,784,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10828/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,078,976,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10829/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,079,168,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10830/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,079,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10831/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,079,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10832/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,079,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10833/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,079,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10834/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,080,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10835/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=2,080,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10836/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=2,080,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10837/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,080,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10838/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,080,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10839/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,081,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10840/500000]
+ optim/total_grad_norm=0.8562
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,081,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10841/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,081,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10842/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,081,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10843/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=2,081,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10844/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=2,082,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10845/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=2,082,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10846/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=2,082,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10847/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,082,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10848/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=2,082,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10849/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,083,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10850/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,083,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10851/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=2,083,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10852/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,083,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10853/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,083,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10854/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,083,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10855/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,084,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10856/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,084,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10857/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,084,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10858/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,084,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10859/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,084,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10860/500000]
+ optim/total_grad_norm=1.003
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=2,085,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10861/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,085,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10862/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=2,085,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10863/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,085,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10864/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,085,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10865/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,086,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10866/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,086,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10867/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,086,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10868/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,086,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10869/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,086,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10870/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,087,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10871/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=2,087,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10872/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,087,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10873/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=2,087,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10874/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,087,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10875/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,088,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10876/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,088,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10877/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,088,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10878/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,088,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10879/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,088,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10880/500000]
+ optim/total_grad_norm=1.319
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,088,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10881/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=2,089,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10882/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=2,089,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10883/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,089,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10884/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,089,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10885/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,089,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10886/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,090,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10887/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,090,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10888/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,090,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10889/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,090,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10890/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,090,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10891/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,091,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10892/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,091,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10893/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,091,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10894/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,091,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10895/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=2,091,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10896/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,092,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10897/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,092,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10898/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,092,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10899/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,092,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10900/500000]
+ optim/total_grad_norm=1.667
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=2,092,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10901/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=2,092,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10902/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,093,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10903/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,093,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10904/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=2,093,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10905/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,093,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10906/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,093,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10907/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,094,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10908/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,094,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10909/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,094,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10910/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,094,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10911/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=2,094,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10912/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,095,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10913/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,095,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10914/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,095,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10915/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=2,095,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10916/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=2,095,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10917/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,096,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10918/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,096,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10919/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,096,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10920/500000]
+ optim/total_grad_norm=1.610
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,096,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10921/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,096,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10922/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,097,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10923/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,097,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10924/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,097,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10925/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=2,097,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10926/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=2,097,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10927/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=2,097,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10928/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,098,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10929/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=2,098,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10930/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,098,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10931/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,098,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10932/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,098,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10933/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,099,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10934/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,099,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10935/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,099,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10936/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,099,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10937/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,099,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10938/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,100,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10939/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=2,100,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10940/500000]
+ optim/total_grad_norm=1.405
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,100,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10941/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,100,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10942/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,100,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10943/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=2,101,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10944/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=2,101,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10945/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,101,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10946/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,101,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10947/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,101,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10948/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=2,102,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10949/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,102,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10950/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,102,400,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=10951/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,102,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10952/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,102,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10953/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,102,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10954/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,103,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10955/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,103,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10956/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,103,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10957/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,103,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10958/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=2,103,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10959/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,104,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10960/500000]
+ optim/total_grad_norm=1.896
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=2,104,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10961/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,104,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10962/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,104,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10963/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=2,104,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10964/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,105,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10965/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,105,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10966/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,105,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10967/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,105,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10968/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,105,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10969/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,106,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10970/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,106,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10971/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,106,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10972/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,106,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10973/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,106,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10974/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,107,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10975/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,107,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10976/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,107,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10977/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,107,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10978/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,107,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10979/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,107,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10980/500000]
+ optim/total_grad_norm=1.097
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,108,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10981/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,108,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10982/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=2,108,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10983/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=2,108,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10984/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,108,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10985/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,109,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10986/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=2,109,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10987/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,109,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10988/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=2,109,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10989/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,109,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10990/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,110,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=10991/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,110,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10992/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=2,110,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10993/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=2,110,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10994/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=2,110,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10995/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=2,111,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10996/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=2,111,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10997/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,111,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10998/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=2,111,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10999/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,111,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11000/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,112,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+10/05 [09:41:08] INFO | >> Saving config... checkpoint.py:608
+10/05 [09:41:41] INFO | >> Saving model state... checkpoint.py:796
+10/05 [09:42:55] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [09:44:21] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11001/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=2,112,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=11002/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,112,384,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11003/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=2,112,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11004/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=2,112,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11005/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,112,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11006/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,113,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11007/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,113,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11008/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,113,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11009/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,113,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11010/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=2,113,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11011/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,114,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11012/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=2,114,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11013/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,114,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11014/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,114,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11015/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=2,114,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11016/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,115,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11017/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,115,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11018/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,115,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11019/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,115,648,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11020/500000]
+ optim/total_grad_norm=1.215
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,115,840,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11021/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,116,032,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11022/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,116,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11023/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,116,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11024/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,116,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11025/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,116,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11026/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,116,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11027/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,117,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11028/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,117,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11029/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,117,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11030/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,117,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11031/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,117,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11032/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=2,118,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11033/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,118,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11034/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,118,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11035/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,118,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11036/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,118,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11037/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,119,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11038/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,119,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11039/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=2,119,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11040/500000]
+ optim/total_grad_norm=1.237
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,119,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11041/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,119,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11042/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,120,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11043/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,120,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11044/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,120,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11045/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,120,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11046/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,120,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11047/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=2,121,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11048/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,121,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11049/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,121,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11050/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=2,121,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11051/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=2,121,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11052/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,121,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11053/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,122,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11054/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,122,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11055/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=2,122,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11056/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,122,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11057/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=2,122,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11058/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=2,123,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11059/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,123,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11060/500000]
+ optim/total_grad_norm=0.9460
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,123,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11061/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,123,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11062/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,123,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11063/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,124,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11064/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=2,124,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11065/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,124,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11066/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,124,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11067/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,124,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11068/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,125,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11069/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,125,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11070/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=2,125,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11071/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,125,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11072/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,125,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11073/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,126,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11074/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=2,126,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11075/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,126,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11076/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,126,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11077/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,126,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11078/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,126,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11079/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,127,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11080/500000]
+ optim/total_grad_norm=1.316
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,127,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11081/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,127,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11082/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=2,127,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11083/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,127,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11084/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,128,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11085/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,128,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11086/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=2,128,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11087/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,128,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11088/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,128,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11089/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,129,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11090/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,129,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11091/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,129,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11092/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,129,664,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11093/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,129,856,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11094/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,130,048,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11095/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,130,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11096/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,130,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11097/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=2,130,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11098/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,130,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11099/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,131,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11100/500000]
+ optim/total_grad_norm=1.164
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,131,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11101/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=2,131,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11102/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=2,131,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11103/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,131,776,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11104/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=2,131,968,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11105/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,132,160,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11106/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,132,352,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11107/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,132,544,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11108/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=2,132,736,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11109/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=2,132,928,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11110/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=2,133,120,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11111/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,133,312,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11112/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,133,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11113/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,133,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11114/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,133,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11115/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,134,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11116/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=2,134,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11117/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,134,464,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11118/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=2,134,656,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11119/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=2,134,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11120/500000]
+ optim/total_grad_norm=2.007
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=2,135,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11121/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,135,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11122/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,135,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11123/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,135,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11124/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,135,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11125/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,136,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11126/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=2,136,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11127/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,136,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11128/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=2,136,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11129/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,136,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11130/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,136,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11131/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,137,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11132/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,137,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11133/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,137,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11134/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,137,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11135/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=2,137,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11136/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,138,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11137/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,138,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11138/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,138,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11139/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,138,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11140/500000]
+ optim/total_grad_norm=1.249
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=2,138,880,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11141/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,139,072,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11142/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,139,264,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11143/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,139,456,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11144/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,139,648,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11145/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,139,840,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11146/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,140,032,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11147/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,140,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11148/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,140,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11149/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,140,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11150/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,140,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11151/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,140,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11152/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,141,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11153/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,141,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11154/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,141,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11155/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,141,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11156/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,141,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11157/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,142,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11158/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,142,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11159/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=2,142,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11160/500000]
+ optim/total_grad_norm=1.084
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,142,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11161/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,142,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11162/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,143,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11163/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,143,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11164/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=2,143,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11165/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,143,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11166/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,143,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11167/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,144,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11168/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,144,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11169/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=2,144,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11170/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,144,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11171/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=2,144,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11172/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,145,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11173/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=2,145,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11174/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,145,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11175/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,145,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11176/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=2,145,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11177/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,145,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11178/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,146,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11179/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=2,146,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11180/500000]
+ optim/total_grad_norm=1.291
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,146,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11181/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=2,146,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11182/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,146,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11183/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=2,147,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11184/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,147,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11185/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,147,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11186/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,147,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11187/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,147,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11188/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,148,096,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11189/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,148,288,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11190/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,148,480,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11191/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,148,672,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11192/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,148,864,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11193/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,149,056,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11194/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=2,149,248,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11195/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,149,440,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11196/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,149,632,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11197/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,149,824,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11198/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=2,150,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11199/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,150,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11200/500000]
+ optim/total_grad_norm=1.349
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,150,400,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11201/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=2,150,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11202/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=2,150,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11203/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,150,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11204/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=2,151,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11205/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=2,151,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11206/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=2,151,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11207/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,151,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11208/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,151,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11209/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,152,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11210/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,152,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11211/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=2,152,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11212/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,152,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11213/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,152,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11214/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,153,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11215/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=2,153,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11216/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,153,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11217/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,153,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11218/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=2,153,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11219/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,154,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11220/500000]
+ optim/total_grad_norm=1.808
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,154,240,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11221/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,154,432,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11222/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,154,624,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11223/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,154,816,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11224/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,155,008,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11225/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,155,200,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11226/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,155,392,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11227/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,155,584,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11228/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,155,776,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11229/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=2,155,968,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11230/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=2,156,160,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11231/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,156,352,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11232/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,156,544,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11233/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,156,736,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11234/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,156,928,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11235/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,157,120,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11236/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,157,312,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11237/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,157,504,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11238/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,157,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11239/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=2,157,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11240/500000]
+ optim/total_grad_norm=0.7773
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,158,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11241/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,158,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11242/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,158,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11243/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,158,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11244/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=2,158,848,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11245/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=2,159,040,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11246/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,159,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11247/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,159,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11248/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,159,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11249/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,159,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11250/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=2,160,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11251/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,160,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11252/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,160,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11253/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,160,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11254/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,160,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11255/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,160,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11256/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,161,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11257/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,161,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11258/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,161,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11259/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,161,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11260/500000]
+ optim/total_grad_norm=1.109
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,161,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11261/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=2,162,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11262/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,162,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11263/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=2,162,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11264/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,162,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11265/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,162,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11266/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,163,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11267/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,163,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11268/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,163,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11269/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=2,163,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11270/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=2,163,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11271/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=2,164,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11272/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,164,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11273/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,164,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11274/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,164,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11275/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,164,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11276/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,164,992,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11277/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,165,184,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11278/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,165,376,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11279/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,165,568,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11280/500000]
+ optim/total_grad_norm=1.203
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,165,760,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11281/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,165,952,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11282/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,166,144,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11283/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,166,336,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11284/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,166,528,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11285/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,166,720,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11286/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=2,166,912,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11287/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,167,104,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11288/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=2,167,296,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11289/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,167,488,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11290/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,167,680,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11291/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=2,167,872,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11292/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,168,064,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11293/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,168,256,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11294/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=2,168,448,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11295/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,168,640,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11296/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,168,832,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11297/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,169,024,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11298/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,169,216,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11299/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,169,408,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11300/500000]
+ optim/total_grad_norm=1.508
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,169,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11301/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,169,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11302/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=2,169,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11303/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,170,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11304/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,170,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11305/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=2,170,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11306/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=2,170,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11307/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=2,170,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11308/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=2,171,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11309/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,171,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11310/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,171,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11311/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,171,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11312/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,171,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11313/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,172,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11314/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,172,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11315/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,172,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11316/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,172,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11317/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,172,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11318/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,173,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11319/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=2,173,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11320/500000]
+ optim/total_grad_norm=1.620
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,173,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11321/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=2,173,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11322/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,173,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11323/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=2,174,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11324/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=2,174,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11325/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,174,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11326/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,174,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11327/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,174,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11328/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=2,174,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11329/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=2,175,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11330/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,175,360,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11331/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=2,175,552,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11332/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,175,744,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11333/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,175,936,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11334/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,176,128,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11335/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=2,176,320,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11336/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=2,176,512,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11337/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,176,704,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11338/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,176,896,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11339/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,177,088,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11340/500000]
+ optim/total_grad_norm=1.433
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=2,177,280,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11341/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=2,177,472,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11342/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,177,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11343/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,177,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11344/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,178,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11345/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,178,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11346/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,178,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11347/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,178,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11348/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,178,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11349/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,179,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11350/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,179,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11351/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,179,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11352/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=2,179,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11353/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,179,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11354/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,179,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11355/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,180,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11356/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,180,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11357/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,180,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11358/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,180,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11359/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,180,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11360/500000]
+ optim/total_grad_norm=1.020
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=2,181,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11361/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=2,181,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11362/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,181,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11363/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,181,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11364/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,181,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11365/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=2,182,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11366/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,182,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11367/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=2,182,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11368/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,182,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11369/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,182,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11370/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=2,183,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11371/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=2,183,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11372/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,183,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11373/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,183,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11374/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,183,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11375/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=2,184,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11376/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,184,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11377/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,184,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11378/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,184,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11379/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,184,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11380/500000]
+ optim/total_grad_norm=1.033
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,184,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11381/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,185,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11382/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,185,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11383/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,185,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11384/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=2,185,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11385/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,185,920,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11386/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,186,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11387/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,186,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11388/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,186,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11389/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,186,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11390/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,186,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11391/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,187,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11392/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,187,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11393/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,187,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11394/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,187,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11395/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=2,187,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11396/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,188,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11397/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,188,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11398/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,188,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11399/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,188,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11400/500000]
+ optim/total_grad_norm=1.544
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,188,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11401/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=2,188,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11402/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,189,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11403/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,189,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11404/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=2,189,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11405/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,189,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11406/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,189,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11407/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,190,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11408/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,190,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11409/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,190,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11410/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=2,190,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11411/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,190,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11412/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,191,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11413/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,191,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11414/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,191,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11415/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=2,191,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11416/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,191,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11417/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,192,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11418/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,192,256,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11419/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,192,448,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11420/500000]
+ optim/total_grad_norm=1.058
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,192,640,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11421/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,192,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11422/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,193,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11423/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,193,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11424/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,193,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11425/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,193,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11426/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,193,792,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11427/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,193,984,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11428/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,194,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11429/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,194,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11430/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,194,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11431/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,194,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11432/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,194,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11433/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,195,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11434/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,195,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11435/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,195,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11436/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,195,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11437/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,195,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11438/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=2,196,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11439/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,196,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11440/500000]
+ optim/total_grad_norm=1.166
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=2,196,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11441/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,196,672,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11442/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,196,864,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11443/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,197,056,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11444/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,197,248,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11445/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,197,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11446/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,197,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11447/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,197,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11448/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,198,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11449/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,198,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11450/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=2,198,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11451/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,198,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11452/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,198,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11453/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=2,198,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11454/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=2,199,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11455/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,199,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11456/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=2,199,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11457/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,199,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11458/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=2,199,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11459/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,200,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11460/500000]
+ optim/total_grad_norm=1.262
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,200,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11461/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,200,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11462/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,200,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11463/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,200,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11464/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,201,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11465/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=2,201,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11466/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,201,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11467/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,201,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11468/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,201,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11469/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=2,202,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11470/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,202,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11471/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,202,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11472/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,202,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11473/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,202,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11474/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,203,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11475/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,203,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11476/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=2,203,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11477/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,203,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11478/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,203,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11479/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,203,968,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11480/500000]
+ optim/total_grad_norm=1.099
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,204,160,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11481/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,204,352,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11482/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=2,204,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11483/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,204,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11484/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,204,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11485/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,205,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11486/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,205,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11487/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,205,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11488/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,205,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11489/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,205,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11490/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=2,206,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11491/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,206,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11492/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=2,206,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11493/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,206,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11494/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,206,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11495/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,207,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11496/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,207,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11497/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=2,207,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11498/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=2,207,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11499/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=2,207,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11500/500000]
+ optim/total_grad_norm=0.9450
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,208,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/05 [12:38:05] INFO | >> Saving config... checkpoint.py:608
+10/05 [12:38:39] INFO | >> Saving model state... checkpoint.py:796
+10/05 [12:39:53] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [12:41:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11501/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,208,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11502/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=2,208,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11503/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,208,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11504/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=2,208,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11505/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,208,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11506/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=2,209,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11507/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,209,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11508/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,209,536,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11509/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,209,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11510/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,209,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11511/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,210,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11512/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,210,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11513/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,210,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11514/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,210,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11515/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,210,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11516/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,211,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11517/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,211,264,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11518/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=2,211,456,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11519/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,211,648,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11520/500000]
+ optim/total_grad_norm=1.074
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,211,840,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11521/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,212,032,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11522/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,212,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11523/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,212,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11524/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,212,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11525/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,212,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11526/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,212,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11527/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,213,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11528/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,213,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11529/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,213,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11530/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,213,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11531/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,213,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11532/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,214,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11533/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,214,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11534/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=2,214,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11535/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=2,214,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11536/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,214,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11537/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,215,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11538/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,215,296,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11539/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,215,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11540/500000]
+ optim/total_grad_norm=1.227
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,215,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11541/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,215,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11542/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,216,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11543/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,216,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11544/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=2,216,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11545/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,216,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11546/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,216,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11547/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,217,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11548/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,217,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11549/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,217,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11550/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,217,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11551/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=2,217,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11552/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,217,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11553/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,218,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11554/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,218,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11555/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,218,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11556/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=2,218,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11557/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,218,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11558/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,219,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11559/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,219,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11560/500000]
+ optim/total_grad_norm=1.289
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,219,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11561/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,219,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11562/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,219,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11563/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=2,220,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11564/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,220,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11565/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=2,220,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11566/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=2,220,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11567/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,220,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11568/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,221,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11569/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,221,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11570/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=2,221,440,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11571/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,221,632,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11572/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=2,221,824,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11573/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=2,222,016,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11574/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=2,222,208,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11575/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,222,400,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11576/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=2,222,592,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11577/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=2,222,784,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11578/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=2,222,976,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11579/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,223,168,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11580/500000]
+ optim/total_grad_norm=1.201
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,223,360,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11581/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,223,552,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11582/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=2,223,744,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11583/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,223,936,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11584/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,224,128,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11585/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=2,224,320,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11586/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,224,512,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11587/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,224,704,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11588/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,224,896,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11589/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,225,088,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11590/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=2,225,280,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11591/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,225,472,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11592/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,225,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11593/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=2,225,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11594/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,226,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11595/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,226,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11596/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=2,226,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11597/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,226,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11598/500000]
+ train/ActionNoiseL2Loss=0.1964
+ throughput/total_tokens=2,226,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11599/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,227,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11600/500000]
+ optim/total_grad_norm=1.040
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,227,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11601/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=2,227,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11602/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,227,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11603/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=2,227,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11604/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,227,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11605/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,228,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11606/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,228,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11607/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,228,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11608/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,228,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11609/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,228,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11610/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,229,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11611/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,229,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11612/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=2,229,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11613/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,229,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11614/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=2,229,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11615/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=2,230,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11616/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,230,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11617/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,230,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11618/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,230,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11619/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,230,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11620/500000]
+ optim/total_grad_norm=1.100
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=2,231,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11621/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,231,232,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11622/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,231,424,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11623/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,231,616,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11624/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,231,808,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11625/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=2,232,000,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11626/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=2,232,192,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11627/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,232,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11628/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=2,232,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11629/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,232,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11630/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=2,232,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11631/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,233,152,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11632/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=2,233,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11633/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,233,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11634/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=2,233,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11635/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,233,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11636/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,234,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11637/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,234,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11638/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,234,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11639/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,234,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11640/500000]
+ optim/total_grad_norm=1.322
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,234,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11641/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,235,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11642/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,235,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11643/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,235,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11644/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,235,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11645/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,235,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11646/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,236,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11647/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,236,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11648/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,236,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11649/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=2,236,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11650/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,236,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11651/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,236,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11652/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,237,184,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11653/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=2,237,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11654/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,237,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11655/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,237,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11656/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,237,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11657/500000]
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=2,238,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11658/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,238,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11659/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,238,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11660/500000]
+ optim/total_grad_norm=1.249
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,238,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11661/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,238,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11662/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,239,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11663/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=2,239,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11664/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,239,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11665/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,239,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11666/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,239,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11667/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=2,240,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11668/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,240,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11669/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,240,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11670/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=2,240,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11671/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,240,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11672/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,241,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11673/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,241,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11674/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,241,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11675/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=2,241,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11676/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,241,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11677/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,241,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11678/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=2,242,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11679/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,242,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11680/500000]
+ optim/total_grad_norm=1.068
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,242,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11681/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=2,242,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11682/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,242,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11683/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,243,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11684/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,243,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11685/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,243,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11686/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,243,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11687/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,243,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11688/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,244,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11689/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,244,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11690/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=2,244,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11691/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=2,244,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11692/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,244,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11693/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,245,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11694/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,245,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11695/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,245,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11696/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=2,245,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11697/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,245,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11698/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,246,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11699/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=2,246,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11700/500000]
+ optim/total_grad_norm=1.268
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=2,246,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11701/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,246,592,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11702/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,246,784,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11703/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,246,976,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11704/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,247,168,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11705/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,247,360,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11706/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=2,247,552,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11707/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,247,744,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11708/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,247,936,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11709/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,248,128,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11710/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=2,248,320,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11711/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,248,512,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11712/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,248,704,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11713/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,248,896,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11714/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,249,088,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11715/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,249,280,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11716/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,249,472,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11717/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,249,664,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11718/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,249,856,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11719/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,250,048,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11720/500000]
+ optim/total_grad_norm=0.8932
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=2,250,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11721/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,250,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11722/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,250,624,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11723/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,250,816,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11724/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=2,251,008,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11725/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,251,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11726/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=2,251,392,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11727/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,251,584,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11728/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,251,776,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11729/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,251,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11730/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,252,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11731/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,252,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11732/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,252,544,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11733/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,252,736,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11734/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=2,252,928,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11735/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,253,120,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11736/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,253,312,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11737/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,253,504,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11738/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=2,253,696,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11739/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,253,888,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11740/500000]
+ optim/total_grad_norm=1.033
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,254,080,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11741/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=2,254,272,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11742/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=2,254,464,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11743/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,254,656,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11744/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,254,848,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11745/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=2,255,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11746/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,255,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11747/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,255,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11748/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,255,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11749/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,255,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11750/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,256,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11751/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,256,192,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11752/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,256,384,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11753/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,256,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11754/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,256,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11755/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,256,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11756/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,257,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11757/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,257,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11758/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=2,257,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11759/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,257,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11760/500000]
+ optim/total_grad_norm=0.8132
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,257,920,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11761/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,258,112,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11762/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=2,258,304,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11763/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,258,496,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11764/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,258,688,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11765/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,258,880,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11766/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,259,072,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11767/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=2,259,264,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11768/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,259,456,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11769/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=2,259,648,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11770/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,259,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11771/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=2,260,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11772/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,260,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11773/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,260,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11774/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,260,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11775/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,260,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11776/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,260,992,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11777/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=2,261,184,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11778/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,261,376,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11779/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,261,568,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11780/500000]
+ optim/total_grad_norm=0.8225
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,261,760,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11781/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,261,952,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11782/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,262,144,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11783/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,262,336,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11784/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,262,528,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11785/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=2,262,720,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11786/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,262,912,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11787/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=2,263,104,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11788/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,263,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11789/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,263,488,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11790/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=2,263,680,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11791/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,263,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11792/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,264,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11793/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,264,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11794/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,264,448,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11795/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=2,264,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11796/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,264,832,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11797/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,265,024,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11798/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,265,216,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11799/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=2,265,408,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11800/500000]
+ optim/total_grad_norm=1.435
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,265,600,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11801/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,265,792,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11802/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,265,984,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11803/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,266,176,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11804/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,266,368,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11805/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,266,560,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11806/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,266,752,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11807/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,266,944,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11808/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=2,267,136,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11809/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=2,267,328,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11810/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,267,520,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11811/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=2,267,712,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11812/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,267,904,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11813/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=2,268,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11814/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,268,288,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11815/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=2,268,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11816/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,268,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11817/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,268,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11818/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,269,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11819/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,269,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11820/500000]
+ optim/total_grad_norm=0.9549
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,269,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11821/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,269,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11822/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,269,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11823/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,270,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11824/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,270,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11825/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,270,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11826/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,270,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11827/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,270,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11828/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,270,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11829/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,271,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11830/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,271,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11831/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,271,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11832/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=2,271,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11833/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,271,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11834/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,272,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11835/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,272,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11836/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,272,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11837/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,272,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11838/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,272,896,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11839/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,273,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11840/500000]
+ optim/total_grad_norm=1.013
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,273,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11841/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,273,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11842/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,273,664,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11843/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,273,856,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11844/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=2,274,048,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11845/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,274,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11846/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=2,274,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11847/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,274,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11848/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,274,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11849/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,275,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11850/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=2,275,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11851/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,275,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11852/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,275,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11853/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,275,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11854/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,275,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11855/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=2,276,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11856/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=2,276,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11857/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=2,276,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11858/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,276,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11859/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,276,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11860/500000]
+ optim/total_grad_norm=0.8583
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,277,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11861/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,277,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11862/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,277,504,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11863/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,277,696,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11864/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=2,277,888,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11865/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=2,278,080,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11866/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,278,272,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11867/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,278,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11868/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,278,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11869/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,278,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11870/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,279,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11871/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,279,232,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11872/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,279,424,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11873/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,279,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11874/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,279,808,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11875/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=2,280,000,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11876/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,280,192,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11877/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=2,280,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11878/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=2,280,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11879/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,280,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11880/500000]
+ optim/total_grad_norm=0.8304
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,280,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11881/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,281,152,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11882/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,281,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11883/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,281,536,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11884/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=2,281,728,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11885/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,281,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11886/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=2,282,112,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11887/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,282,304,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11888/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,282,496,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11889/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,282,688,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11890/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=2,282,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11891/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,283,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11892/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,283,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11893/500000]
+ train/ActionNoiseL2Loss=0.1656
+ throughput/total_tokens=2,283,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11894/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,283,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11895/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=2,283,840,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11896/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,284,032,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11897/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,284,224,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11898/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=2,284,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11899/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,284,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11900/500000]
+ optim/total_grad_norm=1.037
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,284,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11901/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=2,284,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11902/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,285,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11903/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,285,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11904/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,285,568,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11905/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,285,760,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11906/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,285,952,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11907/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,286,144,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11908/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,286,336,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11909/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=2,286,528,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11910/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,286,720,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11911/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,286,912,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=11912/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,287,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11913/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,287,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11914/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,287,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11915/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,287,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11916/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,287,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11917/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,288,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11918/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,288,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11919/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,288,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11920/500000]
+ optim/total_grad_norm=0.8562
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,288,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11921/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,288,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11922/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,289,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11923/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,289,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11924/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,289,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11925/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,289,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11926/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=2,289,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11927/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,289,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11928/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,290,176,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11929/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,290,368,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11930/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,290,560,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11931/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,290,752,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11932/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,290,944,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11933/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,291,136,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11934/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=2,291,328,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11935/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,291,520,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11936/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,291,712,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11937/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,291,904,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11938/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,292,096,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11939/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,292,288,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11940/500000]
+ optim/total_grad_norm=1.126
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,292,480,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11941/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=2,292,672,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11942/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,292,864,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11943/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=2,293,056,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11944/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,293,248,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11945/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,293,440,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11946/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=2,293,632,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11947/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,293,824,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11948/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,294,016,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11949/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,294,208,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11950/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,294,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11951/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,294,592,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11952/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,294,784,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11953/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,294,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11954/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=2,295,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11955/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,295,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11956/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,295,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11957/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,295,744,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11958/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,295,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11959/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,296,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11960/500000]
+ optim/total_grad_norm=1.102
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,296,320,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11961/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,296,512,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11962/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,296,704,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11963/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,296,896,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11964/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,297,088,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11965/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=2,297,280,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11966/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,297,472,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11967/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=2,297,664,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11968/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,297,856,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11969/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,298,048,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11970/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,298,240,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=11971/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,298,432,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11972/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,298,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11973/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,298,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11974/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,299,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11975/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,299,200,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11976/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=2,299,392,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11977/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,299,584,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11978/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,299,776,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=11979/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=2,299,968,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11980/500000]
+ optim/total_grad_norm=1.146
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,300,160,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11981/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,300,352,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11982/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=2,300,544,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11983/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=2,300,736,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11984/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,300,928,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11985/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,301,120,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11986/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,301,312,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11987/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,301,504,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11988/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,301,696,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11989/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,301,888,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11990/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,302,080,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=11991/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,302,272,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11992/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=2,302,464,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11993/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=2,302,656,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11994/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,302,848,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11995/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,303,040,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11996/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=2,303,232,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11997/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,303,424,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11998/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,303,616,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11999/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,303,808,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=12000/500000]
+ optim/total_grad_norm=1.141
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,304,000,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+10/05 [15:35:02] INFO | >> Saving config... checkpoint.py:608
+10/05 [15:35:51] INFO | >> Saving model state... checkpoint.py:796
+10/05 [15:37:05] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [15:38:38] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=12001/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,304,192,000
+ throughput/device/tokens_per_second=1,197
+ throughput/device/batches_per_second=0.0499
+[step=12002/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,304,384,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12003/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=2,304,576,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12004/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,304,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=12005/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,304,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12006/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=2,305,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12007/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,305,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12008/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,305,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12009/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=2,305,728,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12010/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,305,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12011/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,306,112,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12012/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,306,304,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12013/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=2,306,496,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12014/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=2,306,688,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12015/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,306,880,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12016/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,307,072,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12017/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,307,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12018/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=2,307,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12019/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,307,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12020/500000]
+ optim/total_grad_norm=1.368
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=2,307,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12021/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,308,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12022/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,308,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12023/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,308,416,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12024/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,308,608,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12025/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,308,800,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12026/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,308,992,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12027/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=2,309,184,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12028/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,309,376,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12029/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=2,309,568,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12030/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,309,760,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12031/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,309,952,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12032/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,310,144,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12033/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=2,310,336,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12034/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=2,310,528,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12035/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,310,720,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12036/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,310,912,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12037/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,311,104,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12038/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,311,296,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12039/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,311,488,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12040/500000]
+ optim/total_grad_norm=1.047
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,311,680,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12041/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,311,872,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12042/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,312,064,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12043/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=2,312,256,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12044/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,312,448,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12045/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=2,312,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12046/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,312,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12047/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=2,313,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12048/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,313,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12049/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,313,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12050/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,313,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12051/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,313,792,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12052/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,313,984,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12053/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=2,314,176,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12054/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,314,368,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12055/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,314,560,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12056/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,314,752,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12057/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,314,944,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12058/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,315,136,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12059/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,315,328,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12060/500000]
+ optim/total_grad_norm=1.119
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,315,520,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=12061/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,315,712,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12062/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=2,315,904,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12063/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,316,096,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12064/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,316,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12065/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,316,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12066/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,316,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12067/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=2,316,864,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12068/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,317,056,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12069/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,317,248,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12070/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,317,440,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12071/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,317,632,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12072/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,317,824,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12073/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=2,318,016,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12074/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,318,208,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12075/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,318,400,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12076/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=2,318,592,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12077/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,318,784,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12078/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=2,318,976,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12079/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,319,168,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12080/500000]
+ optim/total_grad_norm=1.287
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,319,360,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12081/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,319,552,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12082/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,319,744,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12083/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,319,936,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12084/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,320,128,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12085/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,320,320,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12086/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=2,320,512,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12087/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=2,320,704,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12088/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,320,896,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12089/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,321,088,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12090/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=2,321,280,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12091/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,321,472,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12092/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,321,664,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12093/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,321,856,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12094/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=2,322,048,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12095/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=2,322,240,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12096/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,322,432,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=12097/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=2,322,624,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12098/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,322,816,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12099/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,323,008,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=12100/500000]
+ optim/total_grad_norm=0.9887
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=2,323,200,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,467
+[step=12101/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,323,392,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12102/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=2,323,584,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12103/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=2,323,776,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12104/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,323,968,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12105/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=2,324,160,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12106/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,324,352,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12107/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,324,544,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12108/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,324,736,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12109/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,324,928,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12110/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,325,120,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=12111/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,325,312,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12112/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,325,504,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12113/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=2,325,696,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12114/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,325,888,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12115/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,326,080,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12116/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,326,272,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12117/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,326,464,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12118/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=2,326,656,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12119/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,326,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12120/500000]
+ optim/total_grad_norm=1.483
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,327,040,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12121/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,327,232,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12122/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=2,327,424,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12123/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,327,616,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12124/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,327,808,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12125/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=2,328,000,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12126/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,328,192,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12127/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,328,384,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12128/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,328,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12129/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,328,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12130/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=2,328,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12131/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=2,329,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12132/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,329,344,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12133/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,329,536,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12134/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,329,728,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12135/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,329,920,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12136/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,330,112,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12137/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,330,304,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12138/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=2,330,496,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12139/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=2,330,688,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12140/500000]
+ optim/total_grad_norm=1.036
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=2,330,880,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12141/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,331,072,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12142/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,331,264,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12143/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,331,456,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12144/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,331,648,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12145/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,331,840,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12146/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,332,032,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12147/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=2,332,224,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12148/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,332,416,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12149/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,332,608,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12150/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,332,800,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12151/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=2,332,992,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12152/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,333,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12153/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,333,376,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12154/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,333,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12155/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,333,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12156/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,333,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12157/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,334,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12158/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,334,336,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12159/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,334,528,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12160/500000]
+ optim/total_grad_norm=1.324
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,334,720,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=12161/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,334,912,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12162/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=2,335,104,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12163/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=2,335,296,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12164/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,335,488,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12165/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,335,680,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12166/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,335,872,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12167/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,336,064,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12168/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,336,256,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12169/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=2,336,448,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12170/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,336,640,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12171/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,336,832,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12172/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,337,024,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12173/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=2,337,216,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12174/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,337,408,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12175/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,337,600,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12176/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,337,792,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12177/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,337,984,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12178/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,338,176,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12179/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,338,368,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12180/500000]
+ optim/total_grad_norm=1.040
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,338,560,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
+[step=12181/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,338,752,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12182/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,338,944,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12183/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=2,339,136,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12184/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,339,328,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12185/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,339,520,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12186/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=2,339,712,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12187/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,339,904,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12188/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,340,096,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12189/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,340,288,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12190/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=2,340,480,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,467
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/requirements.txt b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/wandb-metadata.json b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..a503c8d4f4518bbe36bf38784d8ceae03c997d4c
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-02T16:45:38.216857Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/all_flow_matching",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "all",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_all.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/all_flow_matching/wandb",
+ "host": "auh7-1b-gpu-266",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50483982336"
+ }
+ },
+ "memory": {
+ "total": "2434606915584"
+ },
+ "gpu_amd": [
+ {
+ "id": "6",
+ "uniqueId": "0x38b61e086b79539",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xdaf8107e479aecf0",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0xef820a5c24b0c740",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x1633d5497b099b7f",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0xec87d8b9ba4d4aa9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0x55366988951d07ad",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xe7ce40a1ea1cbac2",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x433fd00772eb3fb7",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759682693",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2295",
+ "job_name": "mh_all_flow_matching",
+ "job_nodelist": "auh7-1b-gpu-266",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759423493",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2295",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-266",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "3783754",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-266",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "7sa49miayth30l6v6ockbcw8099vz0ka"
+}
\ No newline at end of file
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-core.log b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..5de21d5172efef40a5496a0f47c935446a9ed078
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:45:38.273125056Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpn_nk7ft2/port-3783943.txt","pid":3783943,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:45:38.273762256Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3783943}
+{"time":"2025-10-02T16:45:38.273740416Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3783943-3784109-3087380137/socket","Net":"unix"}}
+{"time":"2025-10-02T16:45:38.456958681Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:45:38.46398444Z","level":"INFO","msg":"handleInformInit: received","streamId":"si5wp17t","id":"1(@)"}
+{"time":"2025-10-02T16:45:39.48927839Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"si5wp17t","id":"1(@)"}
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-internal.log b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..46bb34f26df4f2aeb63b46b2f2a8239758de40aa
--- /dev/null
+++ b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug-internal.log
@@ -0,0 +1,8 @@
+{"time":"2025-10-02T16:45:38.466053735Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:45:39.489216309Z","level":"INFO","msg":"stream: created new stream","id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48927263Z","level":"INFO","msg":"stream: started","id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48928615Z","level":"INFO","msg":"writer: started","stream_id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.48930321Z","level":"INFO","msg":"sender: started","stream_id":"si5wp17t"}
+{"time":"2025-10-02T16:45:39.489330791Z","level":"INFO","msg":"handler: started","stream_id":"si5wp17t"}
+{"time":"2025-10-03T17:19:10.628180203Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/si5wp17t/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-10-04T16:32:25.479544416Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
diff --git a/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug.log b/all_flow_matching/wandb/wandb/run-20251002_164538-si5wp17t/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/all_l1/wandb/wandb/run-20250930_131250-ea1k0g3y/run-ea1k0g3y.wandb b/all_l1/wandb/wandb/run-20250930_131250-ea1k0g3y/run-ea1k0g3y.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..730e289a16be797ed58ad3be83a830a4337f7564
--- /dev/null
+++ b/all_l1/wandb/wandb/run-20250930_131250-ea1k0g3y/run-ea1k0g3y.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:791be076eb565a57764ddeb640381d4fc6a19b9a1220e3542b3004d143a4a24f
+size 287866880
diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/run-gqyapbwp.wandb b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/run-gqyapbwp.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..226bd5cdaae19dad1a4ac8d6048ea0570c5f61be
--- /dev/null
+++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/run-gqyapbwp.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ad6004c96ed0e1c280e6e41e944c5fd22567170ac3f7070cff7766f01bb175a7
+size 740786176
diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/run-yqnt28c8.wandb b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/run-yqnt28c8.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..f5bb4646eaad147af9f2335069840beda7c7ce09
--- /dev/null
+++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/run-yqnt28c8.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fb877b85877c4cb9df37672a07bc6de19d6862d640c4ea0b1786208c76dcae2
+size 730595328
diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/run-qzez8pv7.wandb b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/run-qzez8pv7.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..b71af48098db7acb04608e93eb4adcdf47013c43
--- /dev/null
+++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/run-qzez8pv7.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:31c1aadb6c784bb4711d0c302fd54eec2975996ade110400a6237d4116f8f1a6
+size 406847488
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/run-7ovz4jzt.wandb b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/run-7ovz4jzt.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..5eb3ddb6f6d4040181139f4cd851cc60fa4d256d
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/run-7ovz4jzt.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7b6cf3cbe7165c1da71c7a456b369621d14ccf90e651d601297a081798b2078
+size 409206784
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/run-a381qnn9.wandb b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/run-a381qnn9.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..7c0a057abff7af93389fea608a7c4630eb665343
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/run-a381qnn9.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0ad952c5053dca5cb28171a15167df83ec11fbf4a60f8da6e23d3547a644bb19
+size 731709440
diff --git a/wipe_flow_matching/wandb/wandb/run-20251005_163812-0cfqmuqw/run-0cfqmuqw.wandb b/wipe_flow_matching/wandb/wandb/run-20251005_163812-0cfqmuqw/run-0cfqmuqw.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..0a4e92718f897580cd9bf18a47aecc4a331d7e4f
--- /dev/null
+++ b/wipe_flow_matching/wandb/wandb/run-20251005_163812-0cfqmuqw/run-0cfqmuqw.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ea072dfff83501ee9c6d74cf4428b1579486d4d84fdba9f0fed27b0d2cfd507
+size 738361344